{"id":"https://openalex.org/W7163027704","doi":"https://doi.org/10.48550/arxiv.2605.31476","title":"IDOL: Inverse-Dynamics-Guided Future Prediction for End-to-End Autonomous Driving","display_name":"IDOL: Inverse-Dynamics-Guided Future Prediction for End-to-End Autonomous Driving","publication_year":2026,"publication_date":"2026-05-29","ids":{"openalex":"https://openalex.org/W7163027704","doi":"https://doi.org/10.48550/arxiv.2605.31476"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.31476","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31476","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.31476","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137595740","display_name":"Chenghao Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chenghao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137548025","display_name":"Timin Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Timin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100417601","display_name":"Dongmei Li","orcid":"https://orcid.org/0000-0001-9140-2483"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Dongmei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9038000106811523,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9038000106811523,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.027799999341368675,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.017500000074505806,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.7139000296592712},{"id":"https://openalex.org/keywords/anticipation","display_name":"Anticipation (artificial intelligence)","score":0.5564000010490417},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.483599990606308},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.46549999713897705},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.42329999804496765},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.4075999855995178},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.3978999853134155},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.3353999853134155},{"id":"https://openalex.org/keywords/chaotic","display_name":"Chaotic","score":0.3222000002861023}],"concepts":[{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.7139000296592712},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6694999933242798},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5618000030517578},{"id":"https://openalex.org/C176777502","wikidata":"https://www.wikidata.org/wiki/Q4774623","display_name":"Anticipation (artificial intelligence)","level":2,"score":0.5564000010490417},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.483599990606308},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.46549999713897705},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.438400000333786},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.42329999804496765},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.4075999855995178},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.3978999853134155},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.3353999853134155},{"id":"https://openalex.org/C2777052490","wikidata":"https://www.wikidata.org/wiki/Q5072826","display_name":"Chaotic","level":2,"score":0.3222000002861023},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.3089999854564667},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.3000999987125397},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C64848388","wikidata":"https://www.wikidata.org/wiki/Q188867","display_name":"Futures studies","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2745000123977661},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C106306483","wikidata":"https://www.wikidata.org/wiki/Q183984","display_name":"Futures contract","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.25440001487731934},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.31476","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31476","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.31476","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31476","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.6476216912269592}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"End-to-end":[0],"autonomous":[1],"driving":[2],"has":[3],"emerged":[4],"as":[5,116],"a":[6,76,135],"compelling":[7],"paradigm":[8,23],"for":[9,104,203],"learning":[10],"planning":[11,45,107,187],"directly":[12],"from":[13,181],"sensor":[14],"observations,":[15],"while":[16],"recent":[17],"world-model-based":[18,105],"approaches":[19],"further":[20,194],"enrich":[21],"this":[22,94],"by":[24,198],"enabling":[25],"explicit":[26],"reasoning":[27,79],"about":[28],"how":[29,161],"the":[30,35,47,68,117,162,175,200,219,229],"scene":[31,63,132,183],"may":[32],"evolve":[33],"in":[34,72,108],"future.":[36],"Yet":[37],"future":[38,62,78,101,121,130,179,215],"prediction":[39,102,122],"alone":[40],"does":[41],"not":[42],"guarantee":[43],"better":[44],"unless":[46],"predicted":[48],"evolution":[49],"can":[50],"be":[51],"converted":[52],"into":[53,185,213],"planning-relevant":[54,156],"trajectory":[55,124,152,202],"updates.":[56],"Many":[57],"current":[58],"methods":[59],"still":[60],"forecast":[61],"states":[64,133],"without":[65],"explicitly":[66],"decoding":[67],"motion":[69,90,157],"implications":[70],"hidden":[71],"state":[73],"transitions.":[74],"As":[75],"result,":[77],"often":[80],"remains":[81],"descriptively":[82],"useful":[83],"but":[84],"only":[85],"weakly":[86],"coupled":[87],"to":[88,145,149,173],"executable":[89],"generation.":[91],"To":[92],"address":[93],"limitation,":[95],"we":[96],"propose":[97],"\\mathbf{IDOL},":[98],"an":[99,141],"inverse-dynamics-guided":[100],"framework":[103],"end-to-end":[106],"latent":[109,131,147,163,214],"BEV":[110,136],"space,":[111],"where":[112],"inverse":[113,142,211],"dynamics":[114,143,212],"serves":[115],"key":[118],"bridge":[119],"between":[120,221],"and":[123,154,224,232],"optimization.":[125],"IDOL":[126,217,238],"first":[127],"predicts":[128],"multiple":[129],"with":[134],"world":[137,164,222],"model,":[138],"then":[139],"applies":[140],"model":[144],"adjacent":[146],"futures":[148],"decode":[150],"transition-aware":[151],"features":[153],"recover":[155],"deltas":[158],"that":[159,237],"explain":[160],"evolves":[165],"over":[166],"time.":[167],"These":[168],"inverse-dynamics-derived":[169],"signals":[170],"are":[171],"used":[172],"optimize":[174],"planned":[176],"trajectory,":[177],"turning":[178],"forecasting":[180],"passive":[182],"anticipation":[184],"actionable":[186],"guidance.":[188],"A":[189],"lightweight":[190],"closed-loop":[191],"refinement":[192],"module":[193],"improves":[195],"long-horizon":[196],"consistency":[197],"reusing":[199],"optimized":[201],"another":[204],"round":[205],"of":[206],"future-aware":[207],"reasoning.":[208],"By":[209],"introducing":[210],"reasoning,":[216],"tightens":[218],"coupling":[220],"modeling":[223],"planning.":[225],"Extensive":[226],"experiments":[227],"on":[228],"NAVSIM":[230,233],"v1":[231],"v2":[234],"benchmarks":[235],"show":[236],"achieves":[239],"state-of-the-art":[240],"performance":[241],"among":[242],"comparable":[243],"methods.":[244]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-06-02T00:00:00"}
