{"id":"https://openalex.org/W7160983811","doi":"https://doi.org/10.48550/arxiv.2605.11596","title":"HorizonDrive: Self-Corrective Autoregressive World Model for Long-horizon Driving Simulation","display_name":"HorizonDrive: Self-Corrective Autoregressive World Model for Long-horizon Driving Simulation","publication_year":2026,"publication_date":"2026-05-12","ids":{"openalex":"https://openalex.org/W7160983811","doi":"https://doi.org/10.48550/arxiv.2605.11596"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.11596","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.11596","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.11596","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070983856","display_name":"C.J. Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Conglang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102729249","display_name":"Yifan Zhan","orcid":"https://orcid.org/0009-0002-3565-0508"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhan, Yifan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136047598","display_name":"Qingjie Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Qingjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066305904","display_name":"Zhanpeng Ouyang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ouyang, Zhanpeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136068430","display_name":"Yu Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125400519","display_name":"Zihao Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Zihao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136042615","display_name":"Xiaoyang Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Xiaoyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136079384","display_name":"Weiqiang Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Weiqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136088560","display_name":"Qian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Qian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136028551","display_name":"Zhen Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Zhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136084174","display_name":"Yinqiang Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yinqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136051760","display_name":"Wei Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5113976720","display_name":"Zhengqing Chen","orcid":"https://orcid.org/0000-0001-6150-2563"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zhengqing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.16660000383853912,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.16660000383853912,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.1574999988079071,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.1289999932050705,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.7860000133514404},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.6636000275611877},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6462000012397766},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5167999863624573},{"id":"https://openalex.org/keywords/train","display_name":"Train","score":0.4708000123500824},{"id":"https://openalex.org/keywords/bounded-rationality","display_name":"Bounded rationality","score":0.3693999946117401},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.3479999899864197}],"concepts":[{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.7860000133514404},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.6636000275611877},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6462000012397766},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6029000282287598},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5167999863624573},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.4708000123500824},{"id":"https://openalex.org/C58694771","wikidata":"https://www.wikidata.org/wiki/Q814385","display_name":"Bounded rationality","level":2,"score":0.3693999946117401},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.36419999599456787},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.3479999899864197},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.32749998569488525},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.3158000111579895},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3140000104904175},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3000999987125397},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.28209999203681946},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25850000977516174},{"id":"https://openalex.org/C159009313","wikidata":"https://www.wikidata.org/wiki/Q5283159","display_name":"Distributed lag","level":2,"score":0.2522999942302704},{"id":"https://openalex.org/C2778739407","wikidata":"https://www.wikidata.org/wiki/Q165372","display_name":"CLIPS","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.11596","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.11596","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.11596","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.11596","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6328461766242981,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Closed-loop":[0],"driving":[1,12,37,132,234],"simulation":[2],"requires":[3],"real-time":[4,191],"interaction":[5],"beyond":[6],"short":[7],"offline":[8],"clips,":[9],"pushing":[10],"current":[11],"world":[13],"models":[14],"toward":[15],"autoregressive":[16],"(AR)":[17],"rollout.":[18],"Existing":[19],"AR":[20,76,119,131,159,168,197],"distillation":[21],"approaches":[22],"typically":[23],"rely":[24],"on":[25,202],"frame":[26],"sinks":[27],"or":[28],"student-side":[29],"degradation":[30],"training.":[31],"The":[32,86],"former":[33],"transfers":[34],"poorly":[35],"to":[36,39,78,108,143,182,223],"due":[38],"fast":[40],"ego-motion":[41],"and":[42,57,209,213,216,220],"rapid":[43],"scene":[44],"changes,":[45],"while":[46,177,229],"the":[47,52,70,100,110,140,162,224],"latter":[48],"remains":[49,155],"bounded":[50,83,175,200],"by":[51,207,211,218],"teacher's":[53],"single-pass":[54,233],"output":[55],"length":[56],"thus":[58],"provides":[59],"only":[60],"a":[61,91,152,178],"limited":[62],"supervision":[63,81,101,115,173],"horizon.":[64],"A":[65],"natural":[66],"question":[67],"is:":[68],"can":[69],"teacher":[71,93,111,153,164,185],"itself":[72],"be":[73],"extended":[74,166],"via":[75,167],"rollout":[77,136,186,198],"provide":[79],"unbounded-horizon":[80],"at":[82],"memory":[84],"cost?":[85],"key":[87,105],"difficulty":[88],"is":[89,107,122,165],"that":[90,154],"standard":[92],"drifts":[94],"under":[95,174,199],"its":[96,117],"own":[97,118],"predictions,":[98],"contaminating":[99],"it":[102,183],"provides.":[103],"Our":[104],"insight":[106],"make":[109],"rollout-capable,":[112],"ensuring":[113],"reliable":[114],"from":[116,148],"rollouts.":[120,160],"This":[121],"instantiated":[123],"as":[124],"HorizonDrive,":[125],"an":[126],"anti-drifting":[127],"training-and-distillation":[128],"framework":[129],"for":[130,189],"simulation.":[133],"First,":[134],"scheduled":[135],"recovery":[137],"(SRR)":[138],"trains":[139],"base":[141],"model":[142],"reconstruct":[144],"ground-truth":[145],"future":[146],"clips":[147],"prediction-corrupted":[149],"histories,":[150],"yielding":[151],"stable":[156],"across":[157],"long":[158],"Second,":[161],"rollout-capable":[163],"rollout,":[169],"providing":[170],"long-horizon":[171,226],"distribution-matching":[172],"memory,":[176],"short-window":[179],"student":[180],"aligns":[181],"with":[184,232],"DMD":[187],"(TRD)":[188],"efficient":[190],"deployment.":[192],"HorizonDrive":[193,204],"natively":[194],"supports":[195],"minute-scale":[196],"memory;":[201],"nuScenes,":[203],"reduces":[205],"FID":[206],"52%":[208],"FVD":[210],"37%,":[212],"lowers":[214],"ARE":[215],"DTW":[217],"21%":[219],"9%":[221],"relative":[222],"strongest":[225],"streaming":[227],"baselines,":[228],"remaining":[230],"competitive":[231],"video":[235],"generators.":[236]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-14T00:00:00"}
