{"id":"https://openalex.org/W7162541397","doi":"https://doi.org/10.48550/arxiv.2605.26503","title":"Uncertainty-Aware Gaussian Map for Vision-Language Navigation","display_name":"Uncertainty-Aware Gaussian Map for Vision-Language Navigation","publication_year":2026,"publication_date":"2026-05-26","ids":{"openalex":"https://openalex.org/W7162541397","doi":"https://doi.org/10.48550/arxiv.2605.26503"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.26503","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26503","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.26503","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102589918","display_name":"Jianzhe Gao","orcid":"https://orcid.org/0000-0002-0215-5984"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Jianzhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137132732","display_name":"Rui Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137167400","display_name":"Yuxuan Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Yuxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137190471","display_name":"Tongtong Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Tongtong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137104809","display_name":"Yingxue Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yingxue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024908803","display_name":"Zhanguang Zhang","orcid":"https://orcid.org/0000-0003-1134-045X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zhanguang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137121905","display_name":"Sida Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Sida","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137085785","display_name":"Yi Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137097137","display_name":"Wenguan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Wenguan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9541000127792358,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9541000127792358,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.0044999998062849045,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.004100000020116568,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.7002000212669373},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5856000185012817},{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.46959999203681946},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.451200008392334},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.43140000104904175},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.412200003862381},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.40779998898506165},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4068000018596649},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.34619998931884766},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.34200000762939453}],"concepts":[{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.7002000212669373},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6029999852180481},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5856000185012817},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5753999948501587},{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.46959999203681946},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.451200008392334},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4320000112056732},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.43140000104904175},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.40779998898506165},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4068000018596649},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3921000063419342},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.34619998931884766},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.34200000762939453},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33730000257492065},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3319000005722046},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.32829999923706055},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.32420000433921814},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.31859999895095825},{"id":"https://openalex.org/C81692654","wikidata":"https://www.wikidata.org/wiki/Q225926","display_name":"Kriging","level":2,"score":0.3158999979496002},{"id":"https://openalex.org/C131042201","wikidata":"https://www.wikidata.org/wiki/Q493198","display_name":"Endocentric and exocentric","level":4,"score":0.3151000142097473},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.3124000132083893},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3093000054359436},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.3037000000476837},{"id":"https://openalex.org/C198942812","wikidata":"https://www.wikidata.org/wiki/Q496618","display_name":"Semantic property","level":2,"score":0.3000999987125397},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C99102927","wikidata":"https://www.wikidata.org/wiki/Q3058184","display_name":"Scale space","level":4,"score":0.29179999232292175},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.28299999237060547},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C197654239","wikidata":"https://www.wikidata.org/wiki/Q7430757","display_name":"Scene statistics","level":3,"score":0.2687000036239624},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C2776010242","wikidata":"https://www.wikidata.org/wiki/Q4677575","display_name":"Active perception","level":3,"score":0.2644999921321869},{"id":"https://openalex.org/C7218915","wikidata":"https://www.wikidata.org/wiki/Q1054475","display_name":"Gaussian function","level":3,"score":0.26420000195503235},{"id":"https://openalex.org/C51267290","wikidata":"https://www.wikidata.org/wiki/Q5527848","display_name":"Gaussian random field","level":4,"score":0.2630999982357025},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25380000472068787}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.26503","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26503","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.26503","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26503","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision-Language":[0],"Navigation":[1],"(VLN)":[2],"requires":[3],"an":[4],"agent":[5,75],"to":[6,69,121,134,153],"navigate":[7],"3D":[8,86,167],"environments":[9],"following":[10],"natural":[11],"language":[12],"instructions.":[13],"During":[14],"navigation,":[15],"existing":[16],"agents":[17],"commonly":[18],"encounter":[19],"perceptual":[20,53],"uncertainty,":[21],"such":[22,39],"as":[23,173],"insufficient":[24],"evidence":[25],"for":[26],"reliable":[27,179],"grounding":[28],"or":[29],"ambiguity":[30],"in":[31],"interpreting":[32],"spatial":[33],"cues,":[34],"yet":[35],"they":[36],"typically":[37],"ignore":[38],"information":[40],"when":[41],"predicting":[42],"actions.":[43],"In":[44],"this":[45],"work,":[46],"we":[47],"explicitly":[48],"model":[49],"three":[50],"forms":[51],"of":[52,84,102,107,116,150,190],"uncertainty":[54,110,126,140],"(i.e.,":[55],"geometric,":[56],"semantic,":[57],"and":[58,61,99,119,138,175],"appearance":[59,139],"uncertainty)":[60],"integrate":[62],"them":[63,172],"into":[64,160,164],"the":[65,96,103,148,188],"agent's":[66],"observation":[67],"space":[68],"enable":[70],"informed":[71],"decision-making.":[72],"Concretely,":[73],"our":[74,191],"first":[76],"constructs":[77],"a":[78,165],"Semantic":[79],"Gaussian":[80,87,117,131],"Map":[81],"(SGM),":[82],"composed":[83],"differentiable":[85],"primitives":[88],"initialized":[89],"from":[90],"panoramic":[91],"observations,":[92],"that":[93,177],"encodes":[94],"both":[95],"geometric":[97,109],"structure":[98],"semantic":[100,125,132],"content":[101],"environment.":[104],"On":[105],"top":[106],"SGM,":[108,161],"is":[111,127,141],"estimated":[112],"through":[113],"variational":[114],"perturbations":[115],"position":[118],"scale":[120],"assess":[122],"structural":[123],"reliability;":[124],"captured":[128],"by":[129,143],"perturbing":[130],"attributes":[133],"reveal":[135],"ambiguous":[136],"interpretations;":[137],"characterized":[142],"Fisher":[144],"Information,":[145],"which":[146,170],"measures":[147],"sensitivity":[149],"rendered":[151],"observations":[152],"Gaussian-level":[154],"variations.":[155],"These":[156],"uncertainties":[157],"are":[158],"incorporated":[159],"extending":[162],"it":[163],"unified":[166],"Value":[168],"Map,":[169],"grounds":[171],"affordances":[174],"constraints":[176],"support":[178],"navigation.":[180],"Comprehensive":[181],"evaluations":[182],"across":[183],"multiple":[184],"VLN":[185],"benchmarks":[186],"show":[187],"effectiveness":[189],"agent.":[192]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
