{"id":"https://openalex.org/W4399656809","doi":"https://doi.org/10.1109/access.2024.3413864","title":"Visual Hindsight Self-Imitation Learning for Interactive Navigation","display_name":"Visual Hindsight Self-Imitation Learning for Interactive Navigation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4399656809","doi":"https://doi.org/10.1109/access.2024.3413864"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3413864","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3413864","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"http://dx.doi.org/10.1109/access.2024.3413864","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085470105","display_name":"K. M. Kim","orcid":"https://orcid.org/0000-0003-2475-036X"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Kibeom Kim","raw_affiliation_strings":["Interdisciplinary Program in Neuroscience, Seoul National University, Seoul, South Korea","Seoul National University, AIIS"],"raw_orcid":"https://orcid.org/0000-0003-2475-036X","affiliations":[{"raw_affiliation_string":"Interdisciplinary Program in Neuroscience, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University, AIIS","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032369055","display_name":"Moonhoen Lee","orcid":"https://orcid.org/0009-0001-9408-0085"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Moonhoen Lee","raw_affiliation_strings":["AI Institute, Seoul National University (AIIS), Seoul, South Korea","Department of Computer Science and Engineering, Seoul National University, Seoul, South Korea","Interdisciplinary Program in Cognitive Science, Seoul National University, Seoul, South Korea","Seoul National University, AIIS"],"raw_orcid":"https://orcid.org/0009-0001-9408-0085","affiliations":[{"raw_affiliation_string":"AI Institute, Seoul National University (AIIS), Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Seoul National University, Seoul, South Korea","institution_ids":[]},{"raw_affiliation_string":"Interdisciplinary Program in Cognitive Science, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University, AIIS","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059765806","display_name":"Min Whoo Lee","orcid":"https://orcid.org/0009-0000-6681-1031"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Min Whoo Lee","raw_affiliation_strings":["AI Institute, Seoul National University (AIIS), Seoul, South Korea","Department of Computer Science and Engineering, Seoul National University, Seoul, South Korea","Interdisciplinary Program in Cognitive Science, Seoul National University, Seoul, South Korea","Seoul National University, AIIS"],"raw_orcid":"https://orcid.org/0009-0000-6681-1031","affiliations":[{"raw_affiliation_string":"AI Institute, Seoul National University (AIIS), Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Seoul National University, Seoul, South Korea","institution_ids":[]},{"raw_affiliation_string":"Interdisciplinary Program in Cognitive Science, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University, AIIS","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044954751","display_name":"Kisung Shin","orcid":"https://orcid.org/0009-0009-3259-4353"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kisung Shin","raw_affiliation_strings":["Interdisciplinary Program in Artificial Intelligence, Seoul National University, Seoul, South Korea","Seoul National University, AIIS"],"raw_orcid":"https://orcid.org/0009-0009-3259-4353","affiliations":[{"raw_affiliation_string":"Interdisciplinary Program in Artificial Intelligence, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University, AIIS","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062963163","display_name":"Minsu Lee","orcid":"https://orcid.org/0000-0002-9601-3863"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Minsu Lee","raw_affiliation_strings":["AI Institute, Seoul National University (AIIS), Seoul, South Korea","Department of Computer Science and Engineering, Seoul National University, Seoul, South Korea","Interdisciplinary Program in Cognitive Science, Seoul National University, Seoul, South Korea","Seoul National University"],"raw_orcid":"https://orcid.org/0000-0002-9601-3863","affiliations":[{"raw_affiliation_string":"AI Institute, Seoul National University (AIIS), Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Seoul National University, Seoul, South Korea","institution_ids":[]},{"raw_affiliation_string":"Interdisciplinary Program in Cognitive Science, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050928023","display_name":"Byoung\u2010Tak Zhang","orcid":"https://orcid.org/0000-0001-9890-0389"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Byoung-Tak Zhang","raw_affiliation_strings":["Interdisciplinary Program in Neuroscience, Seoul National University, Seoul, South Korea","Seoul National University, AIIS"],"raw_orcid":"https://orcid.org/0000-0001-9890-0389","affiliations":[{"raw_affiliation_string":"Interdisciplinary Program in Neuroscience, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University, AIIS","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5085470105"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.4635,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.61117278,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"12","issue":null,"first_page":"83796","last_page":"83809"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hindsight-bias","display_name":"Hindsight bias","score":0.96755051612854},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7789459228515625},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.7066277265548706},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5932963490486145},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5452755689620972},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.485113263130188},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4540844261646271},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4272606670856476},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.37648120522499084},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.2983851432800293},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.14100730419158936}],"concepts":[{"id":"https://openalex.org/C10347200","wikidata":"https://www.wikidata.org/wiki/Q1960297","display_name":"Hindsight bias","level":2,"score":0.96755051612854},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7789459228515625},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.7066277265548706},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5932963490486145},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5452755689620972},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.485113263130188},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4540844261646271},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4272606670856476},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.37648120522499084},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2983851432800293},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.14100730419158936},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3413864","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3413864","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:a892640863704a3badbcdddc7ed9bc5c","is_oa":true,"landing_page_url":"https://doaj.org/article/a892640863704a3badbcdddc7ed9bc5c","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 83796-83809 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3413864","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3413864","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G279657158","display_name":null,"funder_award_id":"RS-2024-00358416/10%","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G4266587594","display_name":null,"funder_award_id":"RS-2023-00274280/10%","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G5972345699","display_name":null,"funder_award_id":"RS-2024-00353991-SPARC/20%","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":80,"referenced_works":["https://openalex.org/W2044346275","https://openalex.org/W2158782408","https://openalex.org/W2166302491","https://openalex.org/W2187089797","https://openalex.org/W2604382266","https://openalex.org/W2636355936","https://openalex.org/W2774005037","https://openalex.org/W2783375473","https://openalex.org/W2805805280","https://openalex.org/W2896457183","https://openalex.org/W2948978827","https://openalex.org/W2953127211","https://openalex.org/W2962732398","https://openalex.org/W2962887844","https://openalex.org/W2965672435","https://openalex.org/W3009928773","https://openalex.org/W3029795912","https://openalex.org/W3035624836","https://openalex.org/W3035791417","https://openalex.org/W3040834782","https://openalex.org/W3045068663","https://openalex.org/W3046698617","https://openalex.org/W3094542670","https://openalex.org/W3095029720","https://openalex.org/W3120006980","https://openalex.org/W3120387732","https://openalex.org/W3135286130","https://openalex.org/W3163015603","https://openalex.org/W3163878499","https://openalex.org/W3173760279","https://openalex.org/W3178888730","https://openalex.org/W3184282957","https://openalex.org/W3185291728","https://openalex.org/W3210395242","https://openalex.org/W3212325595","https://openalex.org/W3214032446","https://openalex.org/W4207072548","https://openalex.org/W4214860447","https://openalex.org/W4220967017","https://openalex.org/W4225624902","https://openalex.org/W4285407276","https://openalex.org/W4293566037","https://openalex.org/W4311415873","https://openalex.org/W4312863572","https://openalex.org/W4312876407","https://openalex.org/W4312929500","https://openalex.org/W4362515116","https://openalex.org/W4363671520","https://openalex.org/W4378464995","https://openalex.org/W4384918448","https://openalex.org/W4385486983","https://openalex.org/W4386071636","https://openalex.org/W4386075839","https://openalex.org/W4390041933","https://openalex.org/W6692846177","https://openalex.org/W6718092244","https://openalex.org/W6740801417","https://openalex.org/W6747106673","https://openalex.org/W6747912417","https://openalex.org/W6751275834","https://openalex.org/W6751540476","https://openalex.org/W6755207826","https://openalex.org/W6758315252","https://openalex.org/W6767047803","https://openalex.org/W6767518175","https://openalex.org/W6773029903","https://openalex.org/W6776700526","https://openalex.org/W6779463497","https://openalex.org/W6779513676","https://openalex.org/W6779959965","https://openalex.org/W6780443396","https://openalex.org/W6797967685","https://openalex.org/W6802758768","https://openalex.org/W6810604644","https://openalex.org/W6810738896","https://openalex.org/W6851592950","https://openalex.org/W6851604102","https://openalex.org/W6853110611","https://openalex.org/W6854866820","https://openalex.org/W6860041859"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W3196817267","https://openalex.org/W1976600725"],"abstract_inverted_index":{"Interactive":[0],"visual":[1,29,139],"navigation":[2,140],"tasks,":[3,141],"which":[4,73,92],"involve":[5],"following":[6],"instructions":[7,103],"to":[8,101,113],"reach":[9],"and":[10,78,123,148],"interact":[11],"with":[12],"specific":[13],"targets,":[14],"are":[15,22,93],"challenging":[16],"not":[17],"only":[18],"because":[19,27],"successful":[20,127],"experiences":[21],"very":[23],"rare":[24],"but":[25],"also":[26],"complex":[28],"inputs":[30],"require":[31],"a":[32,65],"substantial":[33],"number":[34],"of":[35,52],"samples.":[36],"Previous":[37],"methods":[38],"for":[39,56],"these":[40,61],"tasks":[41],"often":[42],"rely":[43],"on":[44],"intricately":[45],"designed":[46],"dense":[47],"rewards":[48],"or":[49],"the":[50,89,111],"use":[51],"expensive":[53],"expert":[54],"data":[55],"imitation":[57],"learning.":[58],"To":[59],"tackle":[60],"challenges,":[62],"we":[63],"propose":[64],"novel":[66],"approach,":[67],"Visual":[68],"Hindsight":[69],"Self-Imitation":[70],"Learning":[71],"(VHS),":[72],"enables":[74],"re-labeling":[75,122],"in":[76,137],"vision-based":[77,120],"partially":[79],"observable":[80],"environments":[81],"through":[82],"Prototypical":[83],"Goal":[84],"(PG)":[85],"embedding.":[86],"We":[87],"introduce":[88],"PG":[90],"embeddings,":[91],"derived":[94],"from":[95,125],"experienced":[96],"goal":[97,121],"observations,":[98],"as":[99,104],"opposed":[100],"handling":[102],"word":[105],"embeddings.":[106],"This":[107],"embedding":[108],"technique":[109],"allows":[110],"agent":[112],"visually":[114],"reinterpret":[115],"its":[116,143],"unsuccessful":[117],"attempts,":[118],"enabling":[119],"self-imitation":[124],"enhanced":[126],"experiences.":[128],"Experimental":[129],"results":[130],"show":[131],"that":[132],"VHS":[133],"outperforms":[134],"existing":[135],"techniques":[136],"interactive":[138],"confirming":[142],"superior":[144],"performance,":[145],"sample":[146],"efficiency,":[147],"generalization.":[149]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
