{"id":"https://openalex.org/W3120006980","doi":"https://doi.org/10.1109/iros47612.2022.9981090","title":"Memory-Augmented Reinforcement Learning for Image-Goal Navigation","display_name":"Memory-Augmented Reinforcement Learning for Image-Goal Navigation","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W3120006980","doi":"https://doi.org/10.1109/iros47612.2022.9981090","mag":"3120006980"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9981090","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981090","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2101.05181","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110736215","display_name":"Lina Mezghan","orcid":null},"institutions":[{"id":"https://openalex.org/I106785703","display_name":"Institut polytechnique de Grenoble","ror":"https://ror.org/05sbt2524","country_code":"FR","type":"education","lineage":["https://openalex.org/I106785703","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210101348","display_name":"Centre Inria de l'Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/00n8d6z93","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210101348"]},{"id":"https://openalex.org/I4210149092","display_name":"Laboratoire Jean Kuntzmann","ror":"https://ror.org/04ett5b41","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210149092","https://openalex.org/I899635006","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Lina Mezghan","raw_affiliation_strings":["Meta AI","Univ. Grenoble Alpes, Inria, CNRS, Grenoble INP, LJK, Grenoble, France"],"affiliations":[{"raw_affiliation_string":"Meta AI","institution_ids":[]},{"raw_affiliation_string":"Univ. Grenoble Alpes, Inria, CNRS, Grenoble INP, LJK, Grenoble, France","institution_ids":["https://openalex.org/I106785703","https://openalex.org/I4210149092","https://openalex.org/I4210101348","https://openalex.org/I899635006","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060255128","display_name":"Sainbayar Sukhbaatar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sainbayar Sukhbaatar","raw_affiliation_strings":["Meta AI"],"affiliations":[{"raw_affiliation_string":"Meta AI","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090457109","display_name":"Thibaut Lavril","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thibaut Lavril","raw_affiliation_strings":["Meta AI"],"affiliations":[{"raw_affiliation_string":"Meta AI","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076852664","display_name":"Oleksandr Maksymets","orcid":"https://orcid.org/0000-0003-3515-8839"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oleksandr Maksymets","raw_affiliation_strings":["Meta AI"],"affiliations":[{"raw_affiliation_string":"Meta AI","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014035752","display_name":"Dhruv Batra","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dhruv Batra","raw_affiliation_strings":["Meta AI","Georgia Institute of Technology, Georgia"],"affiliations":[{"raw_affiliation_string":"Meta AI","institution_ids":[]},{"raw_affiliation_string":"Georgia Institute of Technology, Georgia","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035420035","display_name":"Piotr Bojanowski","orcid":"https://orcid.org/0000-0001-8098-5900"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Piotr Bojanowski","raw_affiliation_strings":["Meta AI"],"affiliations":[{"raw_affiliation_string":"Meta AI","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049440980","display_name":"Karteek Alahari","orcid":"https://orcid.org/0000-0002-1838-5936"},"institutions":[{"id":"https://openalex.org/I106785703","display_name":"Institut polytechnique de Grenoble","ror":"https://ror.org/05sbt2524","country_code":"FR","type":"education","lineage":["https://openalex.org/I106785703","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210101348","display_name":"Centre Inria de l'Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/00n8d6z93","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210101348"]},{"id":"https://openalex.org/I4210149092","display_name":"Laboratoire Jean Kuntzmann","ror":"https://ror.org/04ett5b41","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210149092","https://openalex.org/I899635006","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Karteek Alahari","raw_affiliation_strings":["Univ. Grenoble Alpes, Inria, CNRS, Grenoble INP, LJK,Grenoble,France,38000"],"affiliations":[{"raw_affiliation_string":"Univ. Grenoble Alpes, Inria, CNRS, Grenoble INP, LJK,Grenoble,France,38000","institution_ids":["https://openalex.org/I106785703","https://openalex.org/I4210149092","https://openalex.org/I4210101348","https://openalex.org/I899635006","https://openalex.org/I1294671590"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5110736215"],"corresponding_institution_ids":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I4210101348","https://openalex.org/I4210149092","https://openalex.org/I899635006"],"apc_list":null,"apc_paid":null,"fwci":12.7956,"has_fulltext":false,"cited_by_count":48,"citation_normalized_percentile":{"value":0.99437858,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":93,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3316","last_page":"3323"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8020541071891785},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7927823066711426},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6785472631454468},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6429144740104675},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6029749512672424},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.47043392062187195},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4206681549549103},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4059258699417114},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.37311244010925293}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8020541071891785},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7927823066711426},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6785472631454468},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6429144740104675},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6029749512672424},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.47043392062187195},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4206681549549103},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4059258699417114},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.37311244010925293},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros47612.2022.9981090","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981090","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2101.05181","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2101.05181","pdf_url":"https://arxiv.org/pdf/2101.05181","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2101.05181","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2101.05181","pdf_url":"https://arxiv.org/pdf/2101.05181","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":84,"referenced_works":["https://openalex.org/W150468168","https://openalex.org/W1612997784","https://openalex.org/W2142362566","https://openalex.org/W2336416123","https://openalex.org/W2593841437","https://openalex.org/W2594903727","https://openalex.org/W2772545238","https://openalex.org/W2774005037","https://openalex.org/W2777032727","https://openalex.org/W2784853476","https://openalex.org/W2786472725","https://openalex.org/W2810785043","https://openalex.org/W2884565639","https://openalex.org/W2890818510","https://openalex.org/W2895453875","https://openalex.org/W2895915466","https://openalex.org/W2914608873","https://openalex.org/W2918728527","https://openalex.org/W2929928372","https://openalex.org/W2950697717","https://openalex.org/W2950885698","https://openalex.org/W2952791429","https://openalex.org/W2953127211","https://openalex.org/W2962789679","https://openalex.org/W2962812366","https://openalex.org/W2962884155","https://openalex.org/W2962887844","https://openalex.org/W2963403868","https://openalex.org/W2963946945","https://openalex.org/W2963948945","https://openalex.org/W2966217762","https://openalex.org/W2973041989","https://openalex.org/W2983335573","https://openalex.org/W2990881323","https://openalex.org/W3001975179","https://openalex.org/W3004691725","https://openalex.org/W3008611878","https://openalex.org/W3009928773","https://openalex.org/W3011144238","https://openalex.org/W3015246624","https://openalex.org/W3016260815","https://openalex.org/W3021708257","https://openalex.org/W3023640063","https://openalex.org/W3029795912","https://openalex.org/W3034431214","https://openalex.org/W3034728521","https://openalex.org/W3035206957","https://openalex.org/W3036497058","https://openalex.org/W3040041096","https://openalex.org/W3049043369","https://openalex.org/W3083980790","https://openalex.org/W3103648783","https://openalex.org/W3106507514","https://openalex.org/W3107575247","https://openalex.org/W3210395242","https://openalex.org/W4205900130","https://openalex.org/W4288331462","https://openalex.org/W4289147137","https://openalex.org/W4294225490","https://openalex.org/W4297795161","https://openalex.org/W4303697778","https://openalex.org/W4307863552","https://openalex.org/W4320471656","https://openalex.org/W4385245566","https://openalex.org/W6606140090","https://openalex.org/W6731334075","https://openalex.org/W6735003056","https://openalex.org/W6739901393","https://openalex.org/W6746700414","https://openalex.org/W6747585041","https://openalex.org/W6748848655","https://openalex.org/W6750106230","https://openalex.org/W6753516098","https://openalex.org/W6754571906","https://openalex.org/W6754725917","https://openalex.org/W6754957883","https://openalex.org/W6758824984","https://openalex.org/W6764173040","https://openalex.org/W6773029903","https://openalex.org/W6773298664","https://openalex.org/W6774815639","https://openalex.org/W6776559744","https://openalex.org/W6780167394","https://openalex.org/W6780443396"],"related_works":["https://openalex.org/W2081900870","https://openalex.org/W4306904969","https://openalex.org/W3162204513","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W2312145515"],"abstract_inverted_index":{"In":[0],"this":[1,76,109],"work,":[2],"we":[3,49,107],"present":[4],"a":[5,51,55,95],"memory-augmented":[6],"approach":[7,85],"for":[8],"image-goal":[9],"navigation.":[10],"Earlier":[11],"attempts,":[12],"including":[13],"RL-based":[14],"and":[15,58,89],"SLAM-based":[16],"approaches":[17],"have":[18],"either":[19],"shown":[20],"poor":[21],"generalization":[22],"performance,":[23],"or":[24,124],"are":[25],"heavily-reliant":[26],"on":[27,34,101],"pose/depth":[28],"sensors.":[29],"Our":[30,70],"method":[31],"is":[32],"based":[33],"an":[35,41,79],"attention-based":[36],"end-to-end":[37],"model":[38,93],"that":[39,91],"leverages":[40],"episodic":[42],"memory":[43],"to":[44,46,62,118,129],"learn":[45],"navigate.":[47],"First,":[48],"train":[50],"state-embedding":[52],"network":[53],"in":[54,126],"self-supervised":[56],"fashion,":[57],"then":[59],"use":[60],"it":[61],"embed":[63],"previously-visited":[64],"states":[65],"into":[66],"the":[67,99,102],"agent's":[68],"memory.":[69],"navigation":[71],"policy":[72],"takes":[73],"advantage":[74],"of":[75,98],"information":[77,120],"through":[78],"attention":[80],"mechanism.":[81],"We":[82],"validate":[83],"our":[84,92],"with":[86],"extensive":[87],"evaluations,":[88],"show":[90],"establishes":[94],"new":[96],"state":[97],"art":[100],"challenging":[103],"Gibson":[104],"dataset.":[105],"Furthermore,":[106],"achieve":[108],"impressive":[110],"performance":[111],"from":[112],"RGB":[113],"input":[114],"alone,":[115],"without":[116],"access":[117],"additional":[119],"such":[121],"as":[122],"position":[123],"depth,":[125],"stark":[127],"contrast":[128],"related":[130],"work.":[131]},"counts_by_year":[{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":2}],"updated_date":"2026-02-01T03:34:12.195049","created_date":"2021-01-18T00:00:00"}
