{"id":"https://openalex.org/W7133695445","doi":"https://doi.org/10.48550/arxiv.2603.03646","title":"InfinityStory: Unlimited Video Generation with World Consistency and Character-Aware Shot Transitions","display_name":"InfinityStory: Unlimited Video Generation with World Consistency and Character-Aware Shot Transitions","publication_year":2026,"publication_date":"2026-03-04","ids":{"openalex":"https://openalex.org/W7133695445","doi":"https://doi.org/10.48550/arxiv.2603.03646"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.03646","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128156979","display_name":"Mohamed Elmoghany","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Elmoghany, Mohamed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041967855","display_name":"Liangbing Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Liangbing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020511969","display_name":"Xiaoqian Shen","orcid":"https://orcid.org/0000-0001-6284-520X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Xiaoqian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128150010","display_name":"Subhojyoti Mukherjee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mukherjee, Subhojyoti","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128137254","display_name":"Yang Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128173283","display_name":"Gang Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Gang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070047759","display_name":"Viet Dac Lai","orcid":"https://orcid.org/0009-0008-1651-4619"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lai, Viet Dac","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128132297","display_name":"Seunghyun Yoon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoon, Seunghyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128185487","display_name":"Ryan Rossi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rossi, Ryan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127831170","display_name":"Abdullah Rashwan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rashwan, Abdullah","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128178943","display_name":"Puneet Mathur","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mathur, Puneet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128218166","display_name":"Varun Manjunatha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manjunatha, Varun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107453511","display_name":"Daksh Dangi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dangi, Daksh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128192991","display_name":"Chien Nguyen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Chien","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016933602","display_name":"Nedim Lipka","orcid":"https://orcid.org/0000-0002-3779-7784"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lipka, Nedim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128192108","display_name":"Trung Bui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bui, Trung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128209569","display_name":"Krishna Kumar Singh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Krishna Kumar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128145590","display_name":"Ruiyi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ruiyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027237221","display_name":"Xiaolei Huang","orcid":"https://orcid.org/0000-0003-0478-8715"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Xiaolei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128183951","display_name":"Jaemin Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, Jaemin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128205485","display_name":"Yu Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072397278","display_name":"Namyong Park","orcid":"https://orcid.org/0000-0002-3344-2361"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Namyong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128186636","display_name":"Zhengzhong Tu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tu, Zhengzhong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128188515","display_name":"Hongjie Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hongjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038305381","display_name":"Hoda Eldardiry","orcid":"https://orcid.org/0000-0002-9712-6667"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eldardiry, Hoda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128183339","display_name":"Nesreen Ahmed","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmed, Nesreen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128211728","display_name":"Thien Nguyen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Thien","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128158331","display_name":"Dinesh Manocha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manocha, Dinesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128149973","display_name":"Mohamed Elhoseiny","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elhoseiny, Mohamed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028863551","display_name":"Franck Dernoncourt","orcid":"https://orcid.org/0000-0002-1119-1346"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dernoncourt, Franck","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":30,"corresponding_author_ids":["https://openalex.org/A5128156979"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7232999801635742,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7232999801635742,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.08349999785423279,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.028200000524520874,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.7017999887466431},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.6187000274658203},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.49639999866485596},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.46939998865127563},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.45579999685287476},{"id":"https://openalex.org/keywords/transition","display_name":"Transition (genetics)","score":0.44429999589920044},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.4083999991416931},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.38989999890327454},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.35339999198913574}],"concepts":[{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.7017999887466431},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6973999738693237},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.6187000274658203},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5436999797821045},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.49639999866485596},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47290000319480896},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.46939998865127563},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.45579999685287476},{"id":"https://openalex.org/C194232998","wikidata":"https://www.wikidata.org/wiki/Q1606712","display_name":"Transition (genetics)","level":3,"score":0.44429999589920044},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.4083999991416931},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.38989999890327454},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.35339999198913574},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.33899998664855957},{"id":"https://openalex.org/C137105694","wikidata":"https://www.wikidata.org/wiki/Q3407510","display_name":"Local consistency","level":4,"score":0.321399986743927},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.3172999918460846},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3107999861240387},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C31388003","wikidata":"https://www.wikidata.org/wiki/Q7624548","display_name":"Strong consistency","level":3,"score":0.2948000133037567},{"id":"https://openalex.org/C2992734406","wikidata":"https://www.wikidata.org/wiki/Q413267","display_name":"One shot","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C2780575108","wikidata":"https://www.wikidata.org/wiki/Q7316652","display_name":"Retargeting","level":2,"score":0.2775999903678894},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C37279795","wikidata":"https://www.wikidata.org/wiki/Q2492305","display_name":"Consistency model","level":3,"score":0.27059999108314514},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2551000118255615},{"id":"https://openalex.org/C93361087","wikidata":"https://www.wikidata.org/wiki/Q4426698","display_name":"Data consistency","level":2,"score":0.2535000145435333},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C2778701210","wikidata":"https://www.wikidata.org/wiki/Q28130034","display_name":"Constructive","level":3,"score":0.25209999084472656}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.03646","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.03646","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.03646","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.03646","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generating":[0],"long-form":[1],"storytelling":[2],"videos":[3],"with":[4,98],"consistent":[5],"visual":[6,51],"narratives":[7],"remains":[8],"a":[9,17,22,45,65,99],"significant":[10],"challenge":[11],"in":[12],"video":[13,67],"synthesis.":[14],"We":[15,62],"present":[16],"novel":[18],"framework,":[19],"dataset,":[20],"and":[21,37,59,125,137],"model":[23],"that":[24,49,70],"address":[25],"three":[26],"critical":[27],"limitations:":[28],"background":[29],"consistency":[30],"across":[31,53],"shots,":[32],"seamless":[33],"multi-subject":[34,104],"shot-to-shot":[35],"transitions,":[36,136],"scalability":[38],"to":[39],"hour-long":[40],"narratives.":[41],"Our":[42],"approach":[43],"introduces":[44],"background-consistent":[46],"generation":[47],"pipeline":[48],"maintains":[50],"coherence":[52],"scenes":[54],"while":[55],"preserving":[56],"character":[57],"identity":[58],"spatial":[60],"relationships.":[61],"further":[63],"propose":[64],"transition-aware":[66],"synthesis":[68],"module":[69],"generates":[71],"smooth":[72],"shot":[73],"transitions":[74],"for":[75],"complex":[76],"scenarios":[77],"involving":[78],"multiple":[79],"subjects":[80],"entering":[81],"or":[82],"exiting":[83],"frames,":[84],"going":[85],"beyond":[86],"the":[87,116,126],"single-subject":[88],"limitations":[89],"of":[90,102],"prior":[91],"work.":[92],"To":[93],"support":[94],"this,":[95],"we":[96],"contribute":[97],"synthetic":[100],"dataset":[101],"10,000":[103],"transition":[105],"sequences":[106],"covering":[107],"underrepresented":[108],"dynamic":[109],"scene":[110],"compositions.":[111],"On":[112],"VBench,":[113],"InfinityStory":[114],"achieves":[115],"highest":[117,121],"Background":[118],"Consistency":[119,123],"(88.94),":[120],"Subject":[122],"(82.11),":[124],"best":[127],"overall":[128],"average":[129],"rank":[130],"(2.80),":[131],"showing":[132],"improved":[133],"stability,":[134],"smoother":[135],"better":[138],"temporal":[139],"coherence.":[140]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-06T00:00:00"}
