{"id":"https://openalex.org/W7138169561","doi":"https://doi.org/10.48550/arxiv.2603.14807","title":"HiMemVLN: Enhancing Reliability of Open-Source Zero-Shot Vision-and-Language Navigation with Hierarchical Memory System","display_name":"HiMemVLN: Enhancing Reliability of Open-Source Zero-Shot Vision-and-Language Navigation with Hierarchical Memory System","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7138169561","doi":"https://doi.org/10.48550/arxiv.2603.14807"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.14807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.14807","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110962115","display_name":"Kailin Lyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lyu, Kailin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034105691","display_name":"Kangyi Wu","orcid":"https://orcid.org/0000-0001-7382-4949"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Kangyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048567115","display_name":"Pengna Li","orcid":"https://orcid.org/0000-0002-8477-8340"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Pengna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129742011","display_name":"Xiuyu Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Xiuyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129675547","display_name":"Qingyi Si","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Si, Qingyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076709764","display_name":"Cui Miao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miao, Cui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129736668","display_name":"Ning Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Ning","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129682891","display_name":"Zihang Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zihang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129717725","display_name":"Long Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Long","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129751356","display_name":"Lianyu Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Lianyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129676960","display_name":"Jingyuan Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Jingyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129725051","display_name":"Ce Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao, Ce","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.004100000020116568,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.0017999999690800905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5932999849319458},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.5335999727249146},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4253000020980835},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.3952000141143799},{"id":"https://openalex.org/keywords/navigation-system","display_name":"Navigation system","score":0.3935999870300293},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.3073999881744385}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6560999751091003},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5932999849319458},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.5335999727249146},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4253000020980835},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3952000141143799},{"id":"https://openalex.org/C2777891301","wikidata":"https://www.wikidata.org/wiki/Q3475123","display_name":"Navigation system","level":2,"score":0.3935999870300293},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3321000039577484},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3077000081539154},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3073999881744385},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.30709999799728394},{"id":"https://openalex.org/C2778615406","wikidata":"https://www.wikidata.org/wiki/Q11072","display_name":"Amnesia","level":2,"score":0.2921000123023987},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.25360000133514404},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.2535000145435333},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.14807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.14807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LLM-based":[0],"agents":[1],"have":[2,38],"demonstrated":[3],"impressive":[4],"zero-shot":[5,14],"performance":[6,146],"in":[7,133],"vision-language":[8],"navigation":[9,79,85,129],"(VLN)":[10],"tasks.":[11],"However,":[12],"most":[13],"methods":[15],"primarily":[16],"rely":[17],"on":[18],"closed-source":[19,61,94],"LLMs":[20,46],"as":[21],"navigators,":[22],"which":[23,102],"face":[24],"challenges":[25],"related":[26],"to":[27,40,60,84,113],"high":[28],"token":[29],"costs":[30],"and":[31,87,93,118,125,136],"potential":[32],"data":[33],"leakage":[34],"risks.":[35],"Recent":[36],"efforts":[37],"attempted":[39],"address":[41,97],"this":[42,64],"by":[43],"using":[44],"open-source":[45,92,149],"combined":[47],"with":[48],"a":[49,68,74,104,109],"spatiotemporal":[50],"CoT":[51],"framework,":[52],"but":[53],"they":[54],"still":[55],"fall":[56],"far":[57],"short":[58],"compared":[59],"models.":[62],"In":[63],"work,":[65],"we":[66,99],"identify":[67],"critical":[69],"issue,":[70],"Navigation":[71],"Amnesia,":[72],"through":[73],"detailed":[75],"analysis":[76],"of":[77,147],"the":[78,89,122,127,145,148],"process.":[80],"This":[81],"issue":[82,124],"leads":[83],"failures":[86],"amplifies":[88],"gap":[90],"between":[91],"methods.":[95],"To":[96],"this,":[98],"propose":[100],"HiMemVLN,":[101],"incorporates":[103],"Hierarchical":[105],"Memory":[106],"System":[107],"into":[108],"multimodal":[110],"large":[111],"model":[112],"enhance":[114],"visual":[115],"perception":[116],"recall":[117],"long-term":[119],"localization,":[120],"mitigating":[121],"amnesia":[123],"improving":[126],"agent's":[128],"performance.":[130],"Extensive":[131],"experiments":[132],"both":[134],"simulated":[135],"real-world":[137],"environments":[138],"demonstrate":[139],"that":[140],"HiMemVLN":[141],"achieves":[142],"nearly":[143],"twice":[144],"state-of-the-art":[150],"method.":[151],"The":[152],"code":[153],"is":[154],"available":[155],"at":[156],"https://github.com/lvkailin0118/HiMemVLN.":[157]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-18T00:00:00"}
