{"id":"https://openalex.org/W7154494037","doi":"https://doi.org/10.48550/arxiv.2604.12486","title":"DeCoNav: Dialog enhanced Long-Horizon Collaborative Vision-Language Navigation","display_name":"DeCoNav: Dialog enhanced Long-Horizon Collaborative Vision-Language Navigation","publication_year":2026,"publication_date":"2026-04-14","ids":{"openalex":"https://openalex.org/W7154494037","doi":"https://doi.org/10.48550/arxiv.2604.12486"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.12486","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12486","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.12486","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133681085","display_name":"Sunyao Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhou, Sunyao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133725014","display_name":"Yunzi Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yunzi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124892430","display_name":"Tianhang Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Tianhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021234168","display_name":"Xinhai Li","orcid":"https://orcid.org/0000-0003-4514-0149"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xinhai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133648716","display_name":"Guang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Guang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133690065","display_name":"Lizheng Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Lizheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133646890","display_name":"Chenjia Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Chenjia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133676584","display_name":"Xuelong Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xuelong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5133681085"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7807000279426575,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7807000279426575,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.07069999724626541,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.02370000071823597,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendezvous","display_name":"Rendezvous","score":0.8009999990463257},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7337999939918518},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.7138000130653381},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5723999738693237},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.504800021648407},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4255000054836273},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4016000032424927},{"id":"https://openalex.org/keywords/collaboration","display_name":"Collaboration","score":0.3262999951839447}],"concepts":[{"id":"https://openalex.org/C2779968344","wikidata":"https://www.wikidata.org/wiki/Q3932925","display_name":"Rendezvous","level":3,"score":0.8009999990463257},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7836999893188477},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7337999939918518},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.7138000130653381},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.6103000044822693},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5723999738693237},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.504800021648407},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4255000054836273},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4016000032424927},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35280001163482666},{"id":"https://openalex.org/C559553711","wikidata":"https://www.wikidata.org/wiki/Q1145523","display_name":"Collaboration","level":2,"score":0.3262999951839447},{"id":"https://openalex.org/C190954187","wikidata":"https://www.wikidata.org/wiki/Q5270587","display_name":"Dialog system","level":3,"score":0.31520000100135803},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.31439998745918274},{"id":"https://openalex.org/C189693848","wikidata":"https://www.wikidata.org/wiki/Q6031064","display_name":"Information exchange","level":2,"score":0.2962000072002411},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.29409998655319214},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.2922999858856201},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2888000011444092},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.2791999876499176},{"id":"https://openalex.org/C554579003","wikidata":"https://www.wikidata.org/wiki/Q474157","display_name":"Collaborative software","level":2,"score":0.27889999747276306},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2712000012397766},{"id":"https://openalex.org/C138020889","wikidata":"https://www.wikidata.org/wiki/Q2349659","display_name":"Collaborative learning","level":2,"score":0.26910001039505005},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.260699987411499}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.12486","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12486","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.12486","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12486","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.4682369828224182,"id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Long-horizon":[0],"collaborative":[1,30],"vision-language":[2],"navigation":[3],"(VLN)":[4],"is":[5,140],"critical":[6],"for":[7,111,177],"multi-robot":[8,36,178],"systems":[9],"to":[10,47,142],"accomplish":[11],"complex":[12],"tasks":[13,156],"beyond":[14],"the":[15,28,163,170],"capability":[16],"of":[17,172],"a":[18,23,38,69,98,125],"single":[19],"agent.":[20],"CoNavBench":[21],"takes":[22],"first":[24,29],"step":[25],"by":[26,167],"introducing":[27],"long-horizon":[31],"VLN":[32],"benchmark":[33],"with":[34,42,105,154],"relay-style":[35],"tasks,":[37],"collaboration":[39],"taxonomy,":[40],"along":[41],"graph-grounded":[43],"generation":[44],"and":[45,50,58,73,109,146],"evaluation":[46],"model":[48],"handoffs":[49],"rendezvous":[51],"in":[52,152],"shared":[53,70],"environments.":[54],"However,":[55],"existing":[56],"benchmarks":[57],"evaluations":[59],"often":[60],"do":[61],"not":[62],"enforce":[63],"strictly":[64],"synchronized":[65,149],"dual-robot":[66],"rollout":[67],"on":[68,77],"world":[71],"timeline,":[72],"they":[74],"typically":[75],"rely":[76],"static":[78],"coordination":[79],"policies":[80],"that":[81,101],"cannot":[82],"adapt":[83],"when":[84],"new":[85,133],"cross-agent":[86],"evidence":[87],"emerges.":[88],"We":[89],"present":[90],"Dialog":[91],"enhanced":[92],"Long-Horizon":[93],"Collaborative":[94],"Vision-Language":[95],"Navigation":[96],"(DeCoNav),":[97],"decentralized":[99],"framework":[100],"couples":[102],"event-triggered":[103],"dialogue":[104,123,139],"dynamic":[106],"task":[107],"allocation":[108],"replanning":[110],"real-time,":[112],"adaptive":[113],"coordination.":[114],"In":[115],"DeCoNav,":[116],"robots":[117],"exchange":[118],"compact":[119],"semantic":[120],"states":[121],"via":[122],"without":[124],"central":[126],"controller.":[127],"When":[128],"informative":[129],"events":[130],"such":[131],"as":[132],"evidence,":[134],"uncertainty,":[135],"or":[136],"conflicts":[137],"arise,":[138],"triggered":[141],"dynamically":[143,174],"reassign":[144],"subgoals":[145],"replan":[147],"under":[148],"execution.":[150],"Implemented":[151],"DeCoNavBench":[153],"1,213":[155],"across":[157],"176":[158],"HM3D":[159],"scenes,":[160],"DeCoNav":[161],"improves":[162],"both-success":[164],"rate":[165],"(BSR)":[166],"69.2%,":[168],"demonstrating":[169],"effectiveness":[171],"dialogue-driven,":[173],"reallocated":[175],"planning":[176],"collaboration.":[179]},"counts_by_year":[],"updated_date":"2026-04-16T06:09:31.884825","created_date":"2026-04-16T00:00:00"}
