{"id":"https://openalex.org/W3091453879","doi":"https://doi.org/10.1109/icra40945.2020.9196785","title":"Learning Resilient Behaviors for Navigation Under Uncertainty","display_name":"Learning Resilient Behaviors for Navigation Under Uncertainty","publication_year":2020,"publication_date":"2020-05-01","ids":{"openalex":"https://openalex.org/W3091453879","doi":"https://doi.org/10.1109/icra40945.2020.9196785","mag":"3091453879"},"language":"en","primary_location":{"id":"doi:10.1109/icra40945.2020.9196785","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra40945.2020.9196785","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054924375","display_name":"Tingxiang Fan","orcid":"https://orcid.org/0009-0005-6314-2596"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Tingxiang Fan","raw_affiliation_strings":["University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"University of Hong Kong","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016889301","display_name":"Pinxin Long","orcid":"https://orcid.org/0000-0001-8440-3218"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pinxin Long","raw_affiliation_strings":["Robotics and Auto-Driving Lab, Baidu Research"],"affiliations":[{"raw_affiliation_string":"Robotics and Auto-Driving Lab, Baidu Research","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045303340","display_name":"Wenxi Liu","orcid":"https://orcid.org/0000-0002-3630-6322"},"institutions":[{"id":"https://openalex.org/I80947539","display_name":"Fuzhou University","ror":"https://ror.org/011xvna82","country_code":"CN","type":"education","lineage":["https://openalex.org/I80947539"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenxi Liu","raw_affiliation_strings":["Fuzhou University"],"affiliations":[{"raw_affiliation_string":"Fuzhou University","institution_ids":["https://openalex.org/I80947539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076812698","display_name":"Jia Pan","orcid":"https://orcid.org/0000-0001-9003-2054"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jia Pan","raw_affiliation_strings":["University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"University of Hong Kong","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076524203","display_name":"Ruigang Yang","orcid":"https://orcid.org/0000-0001-5296-6307"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruigang Yang","raw_affiliation_strings":["Robotics and Auto-Driving Lab, Baidu Research"],"affiliations":[{"raw_affiliation_string":"Robotics and Auto-Driving Lab, Baidu Research","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004194238","display_name":"Dinesh Manocha","orcid":"https://orcid.org/0000-0001-7047-9801"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dinesh Manocha","raw_affiliation_strings":["University of Maryland, College Park"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5054924375"],"corresponding_institution_ids":["https://openalex.org/I889458895"],"apc_list":null,"apc_paid":null,"fwci":1.9884,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.89246001,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5299","last_page":"5305"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7386854290962219},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6798804402351379},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6299012899398804},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5738442540168762},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.5114204287528992},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4874403774738312},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.45585426688194275},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37864577770233154},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3573806881904602}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7386854290962219},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6798804402351379},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6299012899398804},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5738442540168762},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.5114204287528992},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4874403774738312},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.45585426688194275},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37864577770233154},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3573806881904602},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra40945.2020.9196785","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra40945.2020.9196785","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","score":0.5600000023841858,"display_name":"Life below water"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W192919555","https://openalex.org/W582134693","https://openalex.org/W1522301498","https://openalex.org/W1567512734","https://openalex.org/W1976953317","https://openalex.org/W2020895320","https://openalex.org/W2108677974","https://openalex.org/W2117211893","https://openalex.org/W2145339207","https://openalex.org/W2157331557","https://openalex.org/W2280163991","https://openalex.org/W2320277277","https://openalex.org/W2342840547","https://openalex.org/W2524241275","https://openalex.org/W2586067474","https://openalex.org/W2600383743","https://openalex.org/W2604216058","https://openalex.org/W2605102758","https://openalex.org/W2736601468","https://openalex.org/W2765767940","https://openalex.org/W2781726626","https://openalex.org/W2887927966","https://openalex.org/W2890001928","https://openalex.org/W2912063360","https://openalex.org/W2956805085","https://openalex.org/W2962730596","https://openalex.org/W2962736495","https://openalex.org/W2962907394","https://openalex.org/W2962917939","https://openalex.org/W2963428623","https://openalex.org/W2963722165","https://openalex.org/W2963809389","https://openalex.org/W2963821308","https://openalex.org/W2963938771","https://openalex.org/W2964059111","https://openalex.org/W2964121744","https://openalex.org/W2964319688","https://openalex.org/W2968104655","https://openalex.org/W2968983352","https://openalex.org/W3004264147","https://openalex.org/W3099533866","https://openalex.org/W3101442004","https://openalex.org/W3102961490","https://openalex.org/W4247952382","https://openalex.org/W6617145748","https://openalex.org/W6631190155","https://openalex.org/W6676315081","https://openalex.org/W6695011786","https://openalex.org/W6704559304","https://openalex.org/W6733118196","https://openalex.org/W6735443497","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6752818208","https://openalex.org/W6753624969","https://openalex.org/W6754379355"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2122871747","https://openalex.org/W3114279067"],"abstract_inverted_index":{"Deep":[0],"reinforcement":[1],"learning":[2],"has":[3],"great":[4],"potential":[5],"to":[6,55,57,98,111,165],"acquire":[7],"complex,":[8],"adaptive":[9,72,162],"behaviors":[10,51,75,114,156],"for":[11,76,90],"autonomous":[12,35],"agents":[13],"automatically.":[14],"However,":[15],"the":[16,39,43,65,100,116,122,132,143],"underlying":[17],"neural":[18],"network":[19,110,125],"polices":[20],"have":[21],"not":[22],"been":[23],"widely":[24],"deployed":[25],"in":[26,30,78,115,157],"real-world":[27],"applications,":[28],"especially":[29],"these":[31],"safety-critical":[32],"tasks":[33],"(e.g.,":[34],"driving).":[36],"One":[37],"of":[38],"reasons":[40],"is":[41],"that":[42,67,150],"learned":[44],"policy":[45],"cannot":[46],"perform":[47],"flexible":[48],"and":[49,73,103,128,140,160],"resilient":[50,74,113,155],"as":[52],"traditional":[53],"methods":[54],"adapt":[56],"diverse":[58,158],"environments.":[59,119],"In":[60],"this":[61],"paper,":[62],"we":[63,104,130],"consider":[64],"problem":[66],"a":[68,87,106],"mobile":[69],"robot":[70],"learns":[71],"navigating":[77],"unseen":[79],"uncertain":[80],"environments":[81,159],"while":[82],"avoiding":[83],"collisions.":[84],"We":[85],"present":[86,131],"novel":[88,107],"approach":[89,152],"uncertainty-aware":[91,96,108,124],"navigation":[92,109],"by":[93],"introducing":[94],"an":[95],"predictor":[97],"model":[99],"environmental":[101,166],"uncertainty,":[102],"propose":[105],"learn":[112,154],"prior":[117],"unknown":[118],"To":[120],"train":[121],"proposed":[123],"more":[126],"stably":[127],"efficiently,":[129],"temperature":[133],"decay":[134],"training":[135,144],"paradigm,":[136],"which":[137],"balances":[138],"exploration":[139],"exploitation":[141],"during":[142],"process.":[145],"Our":[146],"experimental":[147],"evaluation":[148],"demonstrates":[149],"our":[151],"can":[153],"generate":[161],"trajectories":[163],"according":[164],"uncertainties.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
