{"id":"https://openalex.org/W7154424237","doi":"https://doi.org/10.48550/arxiv.2604.10103","title":"Long-Horizon Streaming Video Generation via Hybrid Attention with Decoupled Distillation","display_name":"Long-Horizon Streaming Video Generation via Hybrid Attention with Decoupled Distillation","publication_year":2026,"publication_date":"2026-04-11","ids":{"openalex":"https://openalex.org/W7154424237","doi":"https://doi.org/10.48550/arxiv.2604.10103"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.10103","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10103","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.10103","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133601096","display_name":"Ruibin Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Ruibin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065875464","display_name":"Tao Yang","orcid":"https://orcid.org/0000-0002-2276-4023"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Tao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133608710","display_name":"Fangzhou Ai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ai, Fangzhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063972231","display_name":"Tianhe Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Tianhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133576332","display_name":"Shilei Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Shilei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133608377","display_name":"Bingyue Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Bingyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133587577","display_name":"Lei Zhang","orcid":"https://orcid.org/0009-0006-7934-056X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5133601096"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.3156999945640564,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.3156999945640564,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.17630000412464142,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.05299999937415123,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.569599986076355},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.5073000192642212},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.4690000116825104},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.46380001306533813},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4596000015735626},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.4528000056743622},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.4165000021457672},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.38179999589920044}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8198999762535095},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.569599986076355},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.5073000192642212},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.4690000116825104},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.46380001306533813},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4596000015735626},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.4528000056743622},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4345000088214874},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.4165000021457672},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.38179999589920044},{"id":"https://openalex.org/C102392041","wikidata":"https://www.wikidata.org/wiki/Q592860","display_name":"Sliding window protocol","level":3,"score":0.3650999963283539},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.33340001106262207},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32899999618530273},{"id":"https://openalex.org/C76100544","wikidata":"https://www.wikidata.org/wiki/Q4118095","display_name":"Batch distillation","level":4,"score":0.3156999945640564},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28999999165534973},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.28610000014305115},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.2824000120162964},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.2667999863624573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.10103","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10103","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.10103","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10103","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Streaming":[0],"video":[1,8,29,172,190],"generation":[2,173,191],"(SVG)":[3],"distills":[4],"a":[5,36,59,82,127,196],"pretrained":[6],"bidirectional":[7],"diffusion":[9],"model":[10,14,185,204],"into":[11,105],"an":[12],"autoregressive":[13],"equipped":[15],"with":[16,94],"sliding":[17,76,108],"window":[18,109],"attention":[19,61,69,104,135,156],"(SWA).":[20],"However,":[21],"SWA":[22],"inevitably":[23],"loses":[24],"distant":[25],"history":[26],"during":[27],"long":[28],"generation,":[30],"and":[31,55,97,154,170,209],"its":[32],"computational":[33,56,98,118],"overhead":[34],"remains":[35],"critical":[37,122],"challenge":[38],"to":[39,70,86,110,132],"real-time":[40],"deployment.":[41],"In":[42,78],"this":[43],"work,":[44],"we":[45,64,80,101,125],"propose":[46],"Hybrid":[47,177],"Forcing,":[48],"which":[49],"jointly":[50],"optimizes":[51],"temporal":[52,68,92,153],"information":[53],"retention":[54],"efficiency":[57],"through":[58],"hybrid":[60,134],"design.":[62,136],"First,":[63],"introduce":[65,126],"lightweight":[66],"linear":[67,152],"preserve":[71],"long-range":[72],"dependencies":[73],"beyond":[74],"the":[75,106,133,147],"window.":[77],"particular,":[79],"maintain":[81],"compact":[83],"key-value":[84],"state":[85],"incrementally":[87],"absorb":[88],"evicted":[89],"tokens,":[90],"retaining":[91],"context":[93],"negligible":[95],"memory":[96],"overhead.":[99],"Second,":[100],"incorporate":[102],"block-sparse":[103,155],"local":[107],"reduce":[111],"redundant":[112],"computation":[113],"within":[114],"short-range":[115],"modeling,":[116,161],"reallocating":[117],"capacity":[119],"toward":[120],"more":[121],"dependencies.":[123],"Finally,":[124],"decoupled":[128],"distillation":[129,140,148],"strategy":[130],"tailored":[131],"A":[137],"few-step":[138],"initial":[139],"is":[141,157],"performed":[142],"under":[143],"dense":[144],"attention,":[145],"then":[146],"of":[149],"our":[150,184],"proposed":[151],"activated":[158],"for":[159],"streaming":[160],"ensuring":[162],"stable":[163],"optimization.":[164],"Extensive":[165],"experiments":[166],"on":[167,195],"both":[168],"short-":[169],"long-form":[171],"benchmarks":[174],"demonstrate":[175],"that":[176],"Forcing":[178],"consistently":[179],"achieves":[180,186],"state-of-the-art":[181],"performance.":[182],"Notably,":[183],"real-time,":[187],"unbounded":[188],"832x480":[189],"at":[192,214],"29.5":[193],"FPS":[194],"single":[197],"NVIDIA":[198],"H100":[199],"GPU":[200],"without":[201],"quantization":[202],"or":[203],"compression.":[205],"The":[206],"source":[207],"code":[208],"trained":[210],"models":[211],"are":[212],"available":[213],"https://github.com/leeruibin/hybrid-forcing.":[215]},"counts_by_year":[],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2026-04-15T00:00:00"}
