{"id":"https://openalex.org/W7161262407","doi":"https://doi.org/10.48550/arxiv.2605.14696","title":"EponaV2: Driving World Model with Comprehensive Future Reasoning","display_name":"EponaV2: Driving World Model with Comprehensive Future Reasoning","publication_year":2026,"publication_date":"2026-05-14","ids":{"openalex":"https://openalex.org/W7161262407","doi":"https://doi.org/10.48550/arxiv.2605.14696"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.14696","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14696","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.14696","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136259227","display_name":"Jiawei Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jiawei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136225443","display_name":"Zhizhou Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Zhizhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136254813","display_name":"Zhijian Shu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shu, Zhijian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025324377","display_name":"Mingkai Jia","orcid":"https://orcid.org/0000-0003-2100-5305"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Mingkai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136215085","display_name":"Mingxiao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Mingxiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072209031","display_name":"Jia-Wang Bian","orcid":"https://orcid.org/0000-0003-2046-3363"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bian, Jia-Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136273640","display_name":"Qian Zhang","orcid":"https://orcid.org/0009-0004-4339-4115"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Qian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136247528","display_name":"Kaicheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Kaicheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136218050","display_name":"Jin Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Jin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136248189","display_name":"Jian Yang","orcid":"https://orcid.org/0000-0003-4250-1391"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136231601","display_name":"Wei Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.7684000134468079,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.7684000134468079,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.0738999992609024,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.027000000700354576,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.597100019454956},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5968999862670898},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.49889999628067017},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.46380001306533813},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4383000135421753},{"id":"https://openalex.org/keywords/advanced-driver-assistance-systems","display_name":"Advanced driver assistance systems","score":0.4336000084877014}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7067000269889832},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.597100019454956},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5968999862670898},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5742999911308289},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.49889999628067017},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.46380001306533813},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4383000135421753},{"id":"https://openalex.org/C87833898","wikidata":"https://www.wikidata.org/wiki/Q1060280","display_name":"Advanced driver assistance systems","level":2,"score":0.4336000084877014},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.30880001187324524},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2849000096321106},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2842999994754791},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26080000400543213}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.14696","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14696","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.14696","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14696","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.7113197445869446}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Data":[0],"scaling":[1],"plays":[2],"a":[3,86,179],"pivotal":[4],"role":[5],"in":[6,17,76],"the":[7,13,62,133,144,148,154,169,208],"pursuit":[8],"of":[9,64,89,158,172,196,210],"general":[10],"intelligence.":[11],"However,":[12],"prevailing":[14],"perception-planning":[15],"paradigm":[16,88],"autonomous":[18],"driving":[19,39,44,90],"relies":[20],"heavily":[21],"on":[22,55,201],"expensive":[23],"manual":[24],"annotations":[25],"to":[26,61,115,126,141,162,187],"supervise":[27],"trajectory":[28,78,164],"planning,":[29],"which":[30,93,121],"severely":[31],"limits":[32],"its":[33],"scalability.":[34],"Conversely,":[35],"although":[36],"existing":[37],"perception-free":[38,199],"world":[40,91],"models":[41,68,200],"achieve":[42],"impressive":[43],"performance,":[45],"their":[46],"real-world":[47,155],"reasoning":[48,156],"ability":[49],"for":[50],"planning":[51,96,190],"is":[52],"solely":[53],"built":[54],"next":[56],"frame":[57],"image":[58],"forecasting.":[59],"Due":[60],"lack":[63],"enough":[65],"supervision,":[66],"these":[67],"often":[69],"struggle":[70],"with":[71,97],"comprehensive":[72,98,118],"scene":[73],"understanding,":[74],"resulting":[75],"unsatisfactory":[77],"planning.":[79,165],"In":[80],"this":[81],"paper,":[82],"we":[83,111,177],"propose":[84],"EponaV2,":[85,159],"novel":[87],"models,":[92],"achieves":[94],"high-quality":[95],"future":[99,119,127,149],"reasoning.":[100],"Inspired":[101],"by":[102,168],"how":[103],"human":[104],"drivers":[105],"anticipate":[106],"3D":[107,134],"geometry":[108,128],"and":[109,129,135,147],"semantics,":[110],"train":[112],"our":[113,139,211],"model":[114,140],"forecast":[116],"more":[117],"representations,":[120],"can":[122],"be":[123],"additionally":[124],"decoded":[125],"semantic":[130,136],"maps.":[131],"Extracting":[132],"modalities":[137],"enables":[138],"deeply":[142],"understand":[143],"surrounding":[145],"environment,":[146],"prediction":[150],"task":[151],"significantly":[152],"enhances":[153],"capabilities":[157],"ultimately":[160],"leading":[161],"improved":[163],"Moreover,":[166],"inspired":[167],"training":[170],"recipe":[171],"Large":[173],"Language":[174],"Models":[175],"(LLMs),":[176],"introduce":[178],"flow":[180],"matching":[181],"group":[182],"relative":[183],"policy":[184],"optimization":[185],"mechanism":[186],"further":[188],"improve":[189],"accuracy.":[191],"The":[192],"state-of-the-art":[193],"(SOTA)":[194],"performances":[195],"EponaV2":[197],"among":[198],"three":[202],"NAVSIM":[203],"benchmarks":[204],"(+1.3PDMS,":[205],"+5.5EPDMS)":[206],"demonstrate":[207],"effectiveness":[209],"methods.":[212]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-16T00:00:00"}
