{"id":"https://openalex.org/W3135642434","doi":"https://doi.org/10.1109/tnnls.2021.3057424","title":"Visual Navigation With Multiple Goals Based on Deep Reinforcement Learning","display_name":"Visual Navigation With Multiple Goals Based on Deep Reinforcement Learning","publication_year":2021,"publication_date":"2021-03-05","ids":{"openalex":"https://openalex.org/W3135642434","doi":"https://doi.org/10.1109/tnnls.2021.3057424","mag":"3135642434","pmid":"https://pubmed.ncbi.nlm.nih.gov/33667168"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2021.3057424","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3057424","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000822672","display_name":"Zhenhuan Rao","orcid":null},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhenhuan Rao","raw_affiliation_strings":["School of Control Science and Engineering, Shandong University, Jinan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Control Science and Engineering, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103094155","display_name":"Yuechen Wu","orcid":"https://orcid.org/0000-0001-5615-8016"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuechen Wu","raw_affiliation_strings":["School of Control Science and Engineering, Shandong University, Jinan, China"],"raw_orcid":"https://orcid.org/0000-0001-5615-8016","affiliations":[{"raw_affiliation_string":"School of Control Science and Engineering, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013695081","display_name":"Zifei Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zifei Yang","raw_affiliation_strings":["School of Control Science and Engineering, Shandong University, Jinan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Control Science and Engineering, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100756634","display_name":"Wei Zhang","orcid":"https://orcid.org/0000-0002-4960-3190"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]},{"id":"https://openalex.org/I4210164150","display_name":"Shanghai Center for Brain Science and Brain-Inspired Technology","ror":"https://ror.org/0551a0y31","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210164150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["Institute of Brain and Brain-Inspired Science, Shandong University, Jinan, China","School of Control Science and Engineering, Shandong University, Jinan, China"],"raw_orcid":"https://orcid.org/0000-0002-4960-3190","affiliations":[{"raw_affiliation_string":"Institute of Brain and Brain-Inspired Science, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I4210164150","https://openalex.org/I154099455"]},{"raw_affiliation_string":"School of Control Science and Engineering, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023507910","display_name":"Shijian Lu","orcid":"https://orcid.org/0000-0002-6766-2506"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shijian Lu","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-6766-2506","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088357715","display_name":"Weizhi Lu","orcid":"https://orcid.org/0000-0003-3812-7405"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weizhi Lu","raw_affiliation_strings":["School of Control Science and Engineering, Shandong University, Jinan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Control Science and Engineering, Shandong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003217535","display_name":"Zheng-Jun Zha","orcid":"https://orcid.org/0000-0003-2510-8993"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"ZhengJun Zha","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0003-2510-8993","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5000822672"],"corresponding_institution_ids":["https://openalex.org/I154099455"],"apc_list":null,"apc_paid":null,"fwci":3.7865,"has_fulltext":false,"cited_by_count":46,"citation_normalized_percentile":{"value":0.94659794,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"32","issue":"12","first_page":"5445","last_page":"5455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8514906764030457},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.830689549446106},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8041828870773315},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.719895601272583},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.574567973613739},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5687634348869324},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5104657411575317},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4911639392375946},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.40305209159851074},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.367473304271698},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.0739983320236206},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07372215390205383}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8514906764030457},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.830689549446106},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8041828870773315},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.719895601272583},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.574567973613739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5687634348869324},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5104657411575317},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4911639392375946},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40305209159851074},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.367473304271698},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0739983320236206},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07372215390205383},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tnnls.2021.3057424","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3057424","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:33667168","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33667168","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:dr.ntu.edu.sg:10356/163231","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/163231","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.5299999713897705,"display_name":"Partnerships for the goals"}],"awards":[{"id":"https://openalex.org/G1031521155","display_name":null,"funder_award_id":"U1913204","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G159773815","display_name":null,"funder_award_id":"2018CXGC1503","funder_id":"https://openalex.org/F4320329857","funder_display_name":"Major Scientific and Technological Innovation Project of Shandong Province"},{"id":"https://openalex.org/G3584809445","display_name":null,"funder_award_id":"U19B2038","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4513380382","display_name":null,"funder_award_id":"ZR2020JQ29","funder_id":"https://openalex.org/F4320334121","funder_display_name":"Natural Science Fund for Distinguished Young Scholars of Shandong Province"},{"id":"https://openalex.org/G5593383844","display_name":null,"funder_award_id":"61991411","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5769824899","display_name":null,"funder_award_id":"2018AAA0102504","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329857","display_name":"Major Scientific and Technological Innovation Project of Shandong Province","ror":null},{"id":"https://openalex.org/F4320334121","display_name":"Natural Science Fund for Distinguished Young Scholars of Shandong Province","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W567721252","https://openalex.org/W645436802","https://openalex.org/W1520997877","https://openalex.org/W2029143333","https://openalex.org/W2121863487","https://openalex.org/W2145339207","https://openalex.org/W2201581102","https://openalex.org/W2257979135","https://openalex.org/W2417148288","https://openalex.org/W2510924756","https://openalex.org/W2593841437","https://openalex.org/W2596874484","https://openalex.org/W2605564896","https://openalex.org/W2747623286","https://openalex.org/W2783375473","https://openalex.org/W2791797404","https://openalex.org/W2797527950","https://openalex.org/W2798441115","https://openalex.org/W2800142021","https://openalex.org/W2883972132","https://openalex.org/W2893662673","https://openalex.org/W2897554812","https://openalex.org/W2898436992","https://openalex.org/W2910645997","https://openalex.org/W2944153887","https://openalex.org/W2950300520","https://openalex.org/W2950872548","https://openalex.org/W2952578114","https://openalex.org/W2962887844","https://openalex.org/W2963523627","https://openalex.org/W2963800628","https://openalex.org/W2963946945","https://openalex.org/W2964021598","https://openalex.org/W2964043796","https://openalex.org/W2964393431","https://openalex.org/W2966477753","https://openalex.org/W2972758308","https://openalex.org/W2998415550","https://openalex.org/W3004591935","https://openalex.org/W3012783233","https://openalex.org/W3029795912","https://openalex.org/W4293566037","https://openalex.org/W4294225490","https://openalex.org/W4297789683","https://openalex.org/W4297795161","https://openalex.org/W4300799055","https://openalex.org/W4300971732","https://openalex.org/W6616173779","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6729433768","https://openalex.org/W6729556111","https://openalex.org/W6729788943","https://openalex.org/W6731334075","https://openalex.org/W6740801417","https://openalex.org/W6743367460","https://openalex.org/W6747106673","https://openalex.org/W6747912417","https://openalex.org/W6748848655","https://openalex.org/W6750106230","https://openalex.org/W6750629867","https://openalex.org/W6754629161","https://openalex.org/W6756103505","https://openalex.org/W6764339904"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W3162204513","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W20361778"],"abstract_inverted_index":{"Learning":[0],"to":[1,3,42,59,73,90,97,131,148],"adapt":[2],"a":[4,19],"series":[5],"of":[6,104,115],"different":[7],"goals":[8],"in":[9,34],"visual":[10,26],"navigation":[11,27,111],"is":[12,57,125,186],"challenging.":[13],"In":[14],"this":[15],"work,":[16],"we":[17,37,107],"present":[18,108],"model-embedded":[20],"actor-critic":[21],"architecture":[22],"for":[23],"the":[24,31,43,61,75,83,88,100,105,134,143,151,160,166,170],"multigoal":[25,35,52],"task.":[28],"To":[29],"enhance":[30],"task":[32,119],"cooperation":[33],"learning,":[36],"introduce":[38],"two":[39,116],"new":[40],"designs":[41],"reinforcement":[44],"learning":[45],"scheme:":[46],"inverse":[47],"dynamics":[48],"model":[49,112],"(InvDM)":[50],"and":[51,66,68,86,155],"colearning":[53],"(MgCl).":[54],"Specifically,":[55],"InvDM":[56],"proposed":[58,171],"capture":[60],"navigation-relevant":[62],"association":[63],"between":[64,153],"state":[65,135,154],"goal":[67],"provide":[69],"additional":[70],"training":[71],"signals":[72],"relieve":[74],"sparse":[76],"reward":[77],"issue.":[78],"MgCl":[79],"aims":[80],"at":[81,188],"improving":[82],"sample":[84],"efficiency":[85],"supports":[87],"agent":[89,167],"learn":[91],"from":[92],"unintentional":[93],"positive":[94],"experiences.":[95],"Besides,":[96],"further":[98],"improve":[99],"scene":[101],"generalization":[102,181],"capability":[103],"agent,":[106],"an":[109],"enhanced":[110],"that":[113,165],"consists":[114],"self-supervised":[117],"auxiliary":[118],"modules.":[120],"The":[121,139,183],"first":[122],"module,":[123,146],"which":[124],"named":[126],"path":[127],"closed-loop":[128],"detection,":[129],"helps":[130],"understand":[132],"whether":[133],"has":[136],"been":[137],"experienced.":[138],"second":[140],"one,":[141],"namely":[142],"state-target":[144],"matching":[145],"tries":[147],"figure":[149],"out":[150],"difference":[152],"goal.":[156],"Extensive":[157],"results":[158],"on":[159],"interactive":[161],"platform":[162],"AI2-THOR":[163],"demonstrate":[164],"trained":[168],"with":[169],"method":[172],"converges":[173],"faster":[174],"than":[175],"state-of-the-art":[176],"methods":[177],"while":[178],"owning":[179],"good":[180],"capability.":[182],"video":[184],"demonstration":[185],"available":[187],"https://vsislab.github.io/mgvn.":[189]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
