{"id":"https://openalex.org/W7137899647","doi":"https://doi.org/10.48550/arxiv.2603.14938","title":"FAR-Drive: Frame-AutoRegressive Video Generation in Closed-Loop Autonomous Driving","display_name":"FAR-Drive: Frame-AutoRegressive Video Generation in Closed-Loop Autonomous Driving","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7137899647","doi":"https://doi.org/10.48550/arxiv.2603.14938"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.14938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.14938","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033443799","display_name":"Y. Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Yaoru","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045245623","display_name":"Federico Landi","orcid":"https://orcid.org/0000-0003-2092-1934"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Landi, Federico","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010208045","display_name":"Marco Godi","orcid":"https://orcid.org/0000-0002-8501-6524"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Godi, Marco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129733365","display_name":"Xin Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Xin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129701544","display_name":"Ruiju Fu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Ruiju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129687602","display_name":"Yufei Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Yufei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027481590","display_name":"Muyang Sun","orcid":"https://orcid.org/0009-0009-8560-8819"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Muyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129711478","display_name":"Heyu Si","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Si, Heyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129678883","display_name":"Qi Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5033443799"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.013000000268220901,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.010400000028312206,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7099000215530396},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6481000185012817},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.6269999742507935},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5623000264167786},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.40529999136924744},{"id":"https://openalex.org/keywords/on-the-fly","display_name":"On the fly","score":0.3330000042915344}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7099000215530396},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7013000249862671},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6481000185012817},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.6269999742507935},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5623000264167786},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.40529999136924744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38670000433921814},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3531000018119812},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3330000042915344},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.3330000042915344},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.2919999957084656},{"id":"https://openalex.org/C28761237","wikidata":"https://www.wikidata.org/wiki/Q7805321","display_name":"Time horizon","level":2,"score":0.289900004863739},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.2630000114440918},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2531000077724457},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.14938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.14938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"rapid":[1],"progress":[2],"in":[3,36],"autonomous":[4,58,94,171],"driving,":[5],"reliable":[6],"training":[7,122],"and":[8,21,39,49,67,76,115,130,138],"evaluation":[9],"of":[10,19,125],"driving":[11,59,172],"systems":[12],"remain":[13],"fundamentally":[14],"constrained":[15],"by":[16],"the":[17,158],"lack":[18],"scalable":[20],"interactive":[22],"simulation":[23,173],"environments.":[24],"Recent":[25],"generative":[26],"video":[27,90],"models":[28],"achieve":[29],"remarkable":[30],"visual":[31],"fidelity,":[32],"yet":[33],"most":[34],"operate":[35],"open-loop":[37],"settings":[38],"fail":[40],"to":[41],"support":[42],"fine-grained":[43,103],"frame-level":[44,88],"interaction":[45,145],"between":[46],"agent":[47],"actions":[48],"environment":[50],"evolution.":[51],"Building":[52],"a":[53,87,98,120,180],"learning-based":[54],"closed-loop":[55,170],"simulator":[56],"for":[57,93,153],"poses":[60],"three":[61],"major":[62],"challenges:":[63],"maintaining":[64,176],"long-horizon":[65,113],"temporal":[66],"cross-view":[68],"consistency,":[69],"mitigating":[70],"autoregressive":[71,89,132],"degradation":[72],"under":[73,140],"iterative":[74,116],"self-conditioning,":[75],"satisfying":[77],"low-latency":[78,144],"inference":[79,154],"constraints.":[80],"In":[81],"this":[82],"work,":[83],"we":[84,118,147],"propose":[85],"FAR-Drive,":[86],"generation":[91],"framework":[92],"driving.":[95],"We":[96],"introduce":[97],"multi-view":[99],"diffusion":[100],"transformer":[101],"with":[102],"structured":[104],"control,":[105],"enabling":[106],"geometrically":[107],"consistent":[108],"multi-camera":[109],"generation.":[110],"To":[111,142],"address":[112],"consistency":[114,137],"degradation,":[117],"design":[119],"two-stage":[121],"strategy":[123],"consisting":[124],"adaptive":[126],"reference":[127],"horizon":[128],"conditioning":[129],"blend-forcing":[131],"training,":[133],"which":[134],"progressively":[135],"improves":[136],"robustness":[139],"self-conditioning.":[141],"meet":[143],"requirements,":[146],"further":[148],"integrate":[149],"system-level":[150],"efficiency":[151],"optimizations":[152],"acceleration.":[155],"Experiments":[156],"on":[157,179],"nuScenes":[159],"dataset":[160],"demonstrate":[161],"that":[162],"our":[163],"method":[164],"achieves":[165],"state-of-the-art":[166],"performance":[167],"among":[168],"existing":[169],"approaches,":[174],"while":[175],"sub-second":[177],"latency":[178],"single":[181],"GPU.":[182]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-18T00:00:00"}
