{"id":"https://openalex.org/W7161298752","doi":"https://doi.org/10.48550/arxiv.2605.15141","title":"Causal Forcing++: Scalable Few-Step Autoregressive Diffusion Distillation for Real-Time Interactive Video Generation","display_name":"Causal Forcing++: Scalable Few-Step Autoregressive Diffusion Distillation for Real-Time Interactive Video Generation","publication_year":2026,"publication_date":"2026-05-14","ids":{"openalex":"https://openalex.org/W7161298752","doi":"https://doi.org/10.48550/arxiv.2605.15141"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.15141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.15141","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136198931","display_name":"Min Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Min","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136191683","display_name":"Hongzhou Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Hongzhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136223225","display_name":"Kaiwen Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Kaiwen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136258165","display_name":"Zihan Zhou","orcid":"https://orcid.org/0009-0002-9375-1905"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Zihan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045226094","display_name":"Bokai Yan","orcid":"https://orcid.org/0000-0001-7659-5694"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Bokai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136192228","display_name":"Xinyuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xinyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136208846","display_name":"Xiao Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Xiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136219760","display_name":"Chongxuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chongxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136268278","display_name":"Jun Zhu","orcid":"https://orcid.org/0009-0006-7668-2425"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7961999773979187,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7961999773979187,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.03550000116229057,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.024800000712275505,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.734000027179718},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.685699999332428},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.6711999773979187},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5680999755859375},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.48539999127388},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.47929999232292175},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4020000100135803}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7642999887466431},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.734000027179718},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.685699999332428},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.6711999773979187},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5680999755859375},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.48539999127388},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.47929999232292175},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4020000100135803},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.3711000084877014},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3637000024318695},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3449999988079071},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32120001316070557},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.3052000105381012},{"id":"https://openalex.org/C34862557","wikidata":"https://www.wikidata.org/wiki/Q178985","display_name":"Ode","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C138673069","wikidata":"https://www.wikidata.org/wiki/Q322229","display_name":"Tracing","level":2,"score":0.2849000096321106},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.2840000092983246},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.258899986743927},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2531999945640564},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.15141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.15141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Real-time":[0],"interactive":[1],"video":[2],"generation":[3,214],"requires":[4],"low-latency,":[5],"streaming,":[6],"and":[7,42,98,147,159,188,198,223],"controllable":[8],"rollout.":[9],"Existing":[10],"autoregressive":[11],"(AR)":[12],"diffusion":[13],"distillation":[14],"methods":[15],"have":[16],"achieved":[17],"strong":[18],"results":[19],"in":[20,181,185,190,215],"the":[21,67,75,120,143,154,168,175,208,216],"chunk-wise":[22,171],"4-step":[23,170],"regime":[24],"by":[25,38,179,196,203],"distilling":[26],"bidirectional":[27],"base":[28],"models":[29],"into":[30],"few-step":[31,71,85,109],"AR":[32,72,110],"students,":[33],"but":[34,129],"they":[35],"remain":[36],"limited":[37],"coarse":[39],"response":[40],"granularity":[41],"non-negligible":[43],"sampling":[44,60],"latency.":[45],"In":[46,62],"this":[47,63],"paper,":[48],"we":[49,65],"study":[50],"a":[51,70,96,133],"more":[52,157],"aggressive":[53],"setting:":[54],"frame-wise":[55],"autoregression":[56],"with":[57],"only":[58],"1--2":[59],"steps.":[61],"regime,":[64],"identify":[66],"initialization":[68,155],"of":[69,84,218],"student":[73],"as":[74,125],"key":[76],"bottleneck:":[77],"existing":[78],"strategies":[79],"are":[80],"either":[81],"target-misaligned,":[82],"incapable":[83],"generation,":[86],"or":[87],"too":[88],"costly":[89],"to":[90,145,161,210],"scale.":[91],"We":[92,205],"propose":[93],"\\textbf{Causal":[94],"Forcing++},":[95],"principled":[97],"scalable":[99],"pipeline":[100,209],"that":[101,116],"uses":[102],"\\emph{causal":[103],"consistency":[104],"distillation}":[105],"(causal":[106],"CD)":[107],"for":[108],"initialization.":[111],"The":[112,163],"core":[113],"idea":[114],"is":[115],"causal":[117,126],"CD":[118],"learns":[119],"same":[121],"AR-conditional":[122],"flow":[123],"map":[124],"ODE":[127,137],"distillation,":[128],"obtains":[130],"supervision":[131],"from":[132],"single":[134],"online":[135],"teacher":[136],"step":[138],"between":[139],"adjacent":[140],"timesteps,":[141],"avoiding":[142],"need":[144],"precompute":[146],"store":[148],"full":[149],"PF-ODE":[150],"trajectories.":[151],"This":[152],"makes":[153],"both":[156],"efficient":[158],"easier":[160],"optimize.":[162],"resulting":[164],"pipeline,":[165],"\\ours,":[166],"surpasses":[167],"SOTA":[169],"Causal":[172],"Forcing":[173],"under":[174],"\\textit{\\textbf{frame-wise":[176],"2-step":[177],"setting}}":[178],"0.1":[180],"VBench":[182,186],"Total,":[183],"0.3":[184],"Quality,":[187],"0.335":[189],"VisionReward,":[191],"while":[192],"reducing":[193],"first-frame":[194],"latency":[195],"50\\%":[197],"Stage":[199],"2":[200],"training":[201],"cost":[202],"$\\sim$$4\\times$.":[204],"further":[206],"extend":[207],"action-conditioned":[211],"world":[212],"model":[213],"spirit":[217],"Genie3.":[219],"Project":[220],"Page:":[221],"https://github.com/thu-ml/Causal-Forcing":[222],"https://github.com/shengshu-ai/minWM":[224],".":[225]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-16T00:00:00"}
