{"id":"https://openalex.org/W3188853186","doi":"https://doi.org/10.1109/cacre52464.2021.9501321","title":"Towards Efficient Exploration in Unknown Spaces: A Novel Hierarchical Approach Based on Intrinsic Rewards","display_name":"Towards Efficient Exploration in Unknown Spaces: A Novel Hierarchical Approach Based on Intrinsic Rewards","publication_year":2021,"publication_date":"2021-07-01","ids":{"openalex":"https://openalex.org/W3188853186","doi":"https://doi.org/10.1109/cacre52464.2021.9501321","mag":"3188853186"},"language":"en","primary_location":{"id":"doi:10.1109/cacre52464.2021.9501321","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cacre52464.2021.9501321","pdf_url":null,"source":{"id":"https://openalex.org/S4306498778","display_name":"2021 6th International Conference on Automation, Control and Robotics Engineering (CACRE)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 6th International Conference on Automation, Control and Robotics Engineering (CACRE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032366345","display_name":"Yukai Song","orcid":"https://orcid.org/0000-0003-0634-1941"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yukai Song","raw_affiliation_strings":["College of Systems Engineering National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Systems Engineering National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053458494","display_name":"Yue Hu","orcid":"https://orcid.org/0000-0002-8115-7020"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Hu","raw_affiliation_strings":["College of Systems Engineering National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Systems Engineering National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018606189","display_name":"Junjie Zeng","orcid":"https://orcid.org/0000-0002-4353-1093"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junjie Zeng","raw_affiliation_strings":["College of Systems Engineering National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Systems Engineering National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055922843","display_name":"Cong Hu","orcid":"https://orcid.org/0000-0001-8473-077X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Hu","raw_affiliation_strings":["College of Systems Engineering National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Systems Engineering National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064290493","display_name":"Long Qin","orcid":"https://orcid.org/0000-0001-5639-4983"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Long Qin","raw_affiliation_strings":["College of Systems Engineering National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Systems Engineering National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100610161","display_name":"Quanjun Yin","orcid":"https://orcid.org/0000-0002-1633-174X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quanjun Yin","raw_affiliation_strings":["College of Systems Engineering National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Systems Engineering National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5032366345"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.2614,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.63248848,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generality","display_name":"Generality","score":0.7491734027862549},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7122851610183716},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6749899387359619},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6248257160186768},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6113722324371338},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5926914811134338},{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.46681901812553406},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.43064138293266296},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.41910502314567566},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.374324232339859},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1582021415233612}],"concepts":[{"id":"https://openalex.org/C2780767217","wikidata":"https://www.wikidata.org/wiki/Q5532421","display_name":"Generality","level":2,"score":0.7491734027862549},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7122851610183716},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6749899387359619},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6248257160186768},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6113722324371338},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5926914811134338},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.46681901812553406},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.43064138293266296},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.41910502314567566},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.374324232339859},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1582021415233612},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cacre52464.2021.9501321","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cacre52464.2021.9501321","pdf_url":null,"source":{"id":"https://openalex.org/S4306498778","display_name":"2021 6th International Conference on Automation, Control and Robotics Engineering (CACRE)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 6th International Conference on Automation, Control and Robotics Engineering (CACRE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.699999988079071,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G8493858802","display_name":null,"funder_award_id":"61273300","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W326419249","https://openalex.org/W779494576","https://openalex.org/W2000514530","https://openalex.org/W2062644434","https://openalex.org/W2064675550","https://openalex.org/W2076518796","https://openalex.org/W2107667896","https://openalex.org/W2136980446","https://openalex.org/W2144105913","https://openalex.org/W2160589914","https://openalex.org/W2164424353","https://openalex.org/W2194775991","https://openalex.org/W2335959470","https://openalex.org/W2417786368","https://openalex.org/W2433456020","https://openalex.org/W2556477470","https://openalex.org/W2561776174","https://openalex.org/W2562788852","https://openalex.org/W2596982695","https://openalex.org/W2604373826","https://openalex.org/W2736601468","https://openalex.org/W2751973545","https://openalex.org/W2771342126","https://openalex.org/W2772545238","https://openalex.org/W2779977383","https://openalex.org/W2787236409","https://openalex.org/W2888492136","https://openalex.org/W2890274053","https://openalex.org/W2896457183","https://openalex.org/W2899205164","https://openalex.org/W2910054127","https://openalex.org/W2913318911","https://openalex.org/W2913343212","https://openalex.org/W2914608873","https://openalex.org/W2929928372","https://openalex.org/W2949475445","https://openalex.org/W2953100042","https://openalex.org/W2963126744","https://openalex.org/W2963160877","https://openalex.org/W2963262099","https://openalex.org/W2963276097","https://openalex.org/W2963341956","https://openalex.org/W2963523627","https://openalex.org/W2963790038","https://openalex.org/W2964067469","https://openalex.org/W2966477753","https://openalex.org/W2968968404","https://openalex.org/W2997289589","https://openalex.org/W3009928773","https://openalex.org/W3011144238","https://openalex.org/W3018036994","https://openalex.org/W3034956653","https://openalex.org/W3092161856","https://openalex.org/W3129322645","https://openalex.org/W4255468220","https://openalex.org/W6622487243","https://openalex.org/W6650587873","https://openalex.org/W6683436435","https://openalex.org/W6703271639","https://openalex.org/W6716474083","https://openalex.org/W6717230150","https://openalex.org/W6730153900","https://openalex.org/W6730641667","https://openalex.org/W6735033012","https://openalex.org/W6741002519","https://openalex.org/W6747092830","https://openalex.org/W6755207826","https://openalex.org/W6756303580","https://openalex.org/W6758641611","https://openalex.org/W6775522024","https://openalex.org/W6783582377"],"related_works":["https://openalex.org/W1586189497","https://openalex.org/W4319083788","https://openalex.org/W4205364923","https://openalex.org/W3022038857","https://openalex.org/W1537934887","https://openalex.org/W3212134242","https://openalex.org/W4286795643","https://openalex.org/W2137930210","https://openalex.org/W1591434728","https://openalex.org/W2587229774"],"abstract_inverted_index":{"Exploration":[0],"in":[1,51],"unknown":[2],"environments":[3],"using":[4],"deep":[5],"reinforcement":[6],"learning":[7],"(DRL)":[8],"often":[9],"suffers":[10],"from":[11],"sampling":[12],"inefficiency":[13],"due":[14],"to":[15,64,98],"notoriously":[16],"sparse":[17],"extrinsic":[18],"rewards":[19],"and":[20,31,110,116,134,148,156],"complex":[21],"spatial":[22,33],"structures.":[23],"To":[24],"this":[25],"end,":[26],"we":[27],"present":[28],"a":[29,58,66,80,92,151],"hierarchical":[30],"modular":[32],"exploration":[34,76,146],"model":[35,142],"that":[36,72,139],"integrates":[37],"the":[38,49,55,74,85,89,107,140],"recently":[39],"popular":[40],"concept":[41],"of":[42],"intrinsic":[43,123],"motivation":[44],"(IM).":[45],"The":[46],"approach":[47],"addresses":[48],"problem":[50],"two":[52],"levels.":[53],"On":[54,88],"higher":[56],"level,":[57,91],"DRL":[59,155],"based":[60,105,154],"global":[61],"module":[62],"learns":[63],"determine":[65],"distant":[67],"but":[68],"easily":[69],"reachable":[70],"target":[71,81],"maximizes":[73],"current":[75],"progress,":[77],"once":[78],"such":[79],"is":[82,96],"needed":[83],"by":[84],"local":[86],"controller.":[87],"lower":[90],"classical":[93],"path":[94],"planner":[95],"used":[97],"produce":[99],"locally":[100],"smooth":[101],"movements":[102],"between":[103],"targets":[104],"on":[106,132],"known":[108],"areas":[109],"free":[111],"space":[112],"assumption.":[113],"This":[114],"segmented":[115],"sequential":[117],"decision-making":[118],"paradigm,":[119],"with":[120],"an":[121],"informative":[122],"reward":[124],"signal,":[125],"dramatically":[126],"reduces":[127],"training":[128],"difficulty.":[129],"Experimental":[130],"results":[131],"diverse":[133],"challenging":[135],"2D":[136],"maps":[137],"show":[138],"proposed":[141],"has":[143],"consistently":[144],"better":[145],"efficiency":[147],"generality":[149],"than":[150],"state-of-the-art":[152],"IM":[153],"some":[157],"other":[158],"heuristic":[159],"methods.":[160]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
