{"id":"https://openalex.org/W4383108862","doi":"https://doi.org/10.1109/icra48891.2023.10160371","title":"Adaptive and Explainable Deployment of Navigation Skills via Hierarchical Deep Reinforcement Learning","display_name":"Adaptive and Explainable Deployment of Navigation Skills via Hierarchical Deep Reinforcement Learning","publication_year":2023,"publication_date":"2023-05-29","ids":{"openalex":"https://openalex.org/W4383108862","doi":"https://doi.org/10.1109/icra48891.2023.10160371"},"language":"en","primary_location":{"id":"doi:10.1109/icra48891.2023.10160371","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48891.2023.10160371","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078048007","display_name":"Kyowoon Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I48566637","display_name":"Ulsan National Institute of Science and Technology","ror":"https://ror.org/017cjz748","country_code":"KR","type":"education","lineage":["https://openalex.org/I48566637"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Kyowoon Lee","raw_affiliation_strings":["Ulsan National Institute of Science and Technology,Department of Computer Science and Engineering,Ulsan,Republic of Korea","Department of Computer Science and Engineering, Ulsan National Institute of Science and Technology, Ulsan, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Ulsan National Institute of Science and Technology,Department of Computer Science and Engineering,Ulsan,Republic of Korea","institution_ids":["https://openalex.org/I48566637"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Ulsan National Institute of Science and Technology, Ulsan, Republic of Korea","institution_ids":["https://openalex.org/I48566637"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035154514","display_name":"Seongun Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seongun Kim","raw_affiliation_strings":["Graduate School of Artificial Intelligence, Korea Advanced Institute of Science and Technology,Daejeon,Republic of Korea,34141"],"affiliations":[{"raw_affiliation_string":"Graduate School of Artificial Intelligence, Korea Advanced Institute of Science and Technology,Daejeon,Republic of Korea,34141","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052985764","display_name":"Jaesik Choi","orcid":"https://orcid.org/0000-0002-4663-3263"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaesik Choi","raw_affiliation_strings":["Graduate School of Artificial Intelligence, Korea Advanced Institute of Science and Technology,Daejeon,Republic of Korea,34141"],"affiliations":[{"raw_affiliation_string":"Graduate School of Artificial Intelligence, Korea Advanced Institute of Science and Technology,Daejeon,Republic of Korea,34141","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5078048007"],"corresponding_institution_ids":["https://openalex.org/I48566637"],"apc_list":null,"apc_paid":null,"fwci":2.6153,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.91645493,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1673","last_page":"1679"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8891725540161133},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7072773575782776},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.6830431818962097},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5789480805397034},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5270124673843384},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5036274790763855},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.47906407713890076},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3947119116783142},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15469682216644287},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.06811732053756714}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8891725540161133},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7072773575782776},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.6830431818962097},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5789480805397034},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5270124673843384},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5036274790763855},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.47906407713890076},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3947119116783142},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15469682216644287},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.06811732053756714},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra48891.2023.10160371","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48891.2023.10160371","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321681","display_name":"Ministry of Trade, Industry and Energy","ror":"https://ror.org/008nkqk13"},{"id":"https://openalex.org/F4320324891","display_name":"Iran Telecommunication Research Center","ror":"https://ror.org/01a3g2z22"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W259433365","https://openalex.org/W567721252","https://openalex.org/W1522301498","https://openalex.org/W1777239053","https://openalex.org/W2105932936","https://openalex.org/W2585807598","https://openalex.org/W2593841437","https://openalex.org/W2616430965","https://openalex.org/W2736601468","https://openalex.org/W2781697231","https://openalex.org/W2781726626","https://openalex.org/W2886638267","https://openalex.org/W2887927966","https://openalex.org/W2909335861","https://openalex.org/W2912063360","https://openalex.org/W2940779895","https://openalex.org/W2962887844","https://openalex.org/W2962907394","https://openalex.org/W2962937819","https://openalex.org/W2963001155","https://openalex.org/W2963614114","https://openalex.org/W2963821308","https://openalex.org/W2984168904","https://openalex.org/W3026389972","https://openalex.org/W3090832832","https://openalex.org/W3129678734","https://openalex.org/W3131482536","https://openalex.org/W3142599250","https://openalex.org/W3196302130","https://openalex.org/W3202169896","https://openalex.org/W3207293238","https://openalex.org/W4200143243","https://openalex.org/W4288029271","https://openalex.org/W4300799055","https://openalex.org/W6616173779","https://openalex.org/W6631190155","https://openalex.org/W6638088447","https://openalex.org/W6737937804","https://openalex.org/W6740801417","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6749808448","https://openalex.org/W6753624969","https://openalex.org/W6758315252","https://openalex.org/W6767226293","https://openalex.org/W6800948542"],"related_works":["https://openalex.org/W96612179","https://openalex.org/W2770234245","https://openalex.org/W2566006169","https://openalex.org/W2987774938","https://openalex.org/W632915154","https://openalex.org/W4229499248","https://openalex.org/W4378874356","https://openalex.org/W2055733372","https://openalex.org/W2369811061","https://openalex.org/W3089997100"],"abstract_inverted_index":{"For":[0],"robotic":[1],"vehicles":[2],"to":[3,14,42,59],"navigate":[4],"robustly":[5],"and":[6,36,67,129,133,143],"safely":[7],"in":[8,45,127],"unseen":[9],"environments,":[10],"it":[11],"is":[12,77],"crucial":[13],"decide":[15],"the":[16,112,118,130,162],"most":[17,22,119],"suitable":[18,120],"navigation":[19,28,65,84,121,141],"policy.":[20],"However,":[21],"existing":[23],"deep":[24],"reinforcement":[25],"learning":[26,81,154],"based":[27],"policies":[29,66,97],"are":[30,40],"trained":[31],"with":[32,86,102],"a":[33,46,57,61,68,82,87,94,103],"hand-engineered":[34],"curriculum":[35],"reward":[37,89,107],"function":[38],"which":[39,115],"difficult":[41],"be":[43],"deployed":[44],"wide":[47,104],"range":[48,105],"of":[49,63,80,96,106,164],"real-world":[50],"scenarios.":[51],"In":[52],"this":[53],"paper,":[54],"we":[55,91],"propose":[56],"framework":[58,155],"learn":[60,93,139],"family":[62,95],"low-level":[64],"high-level":[69,113],"policy":[70,85,114],"for":[71,161],"deploying":[72],"them.":[73,146],"The":[74],"main":[75],"idea":[76],"that,":[78],"instead":[79],"single":[83],"fixed":[88],"function,":[90],"simultaneously":[92],"that":[98,135,150],"exhibit":[99],"different":[100],"behaviors":[101],"functions.":[108],"We":[109,123,147],"then":[110],"train":[111],"adaptively":[116,144],"deploys":[117],"skill.":[122],"evaluate":[124],"our":[125,136,151],"approach":[126],"simulation":[128],"real":[131],"world":[132],"demonstrate":[134],"method":[137],"can":[138],"diverse":[140],"skills":[142],"deploy":[145],"also":[148],"illustrate":[149],"proposed":[152],"hierarchical":[153],"presents":[156],"explainability":[157],"by":[158],"providing":[159],"semantics":[160],"behavior":[163],"an":[165],"autonomous":[166],"agent.":[167]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
