{"id":"https://openalex.org/W7154616844","doi":"https://doi.org/10.48550/arxiv.2604.13452","title":"CANVAS: Continuity-Aware Narratives via Visual Agentic Storyboarding","display_name":"CANVAS: Continuity-Aware Narratives via Visual Agentic Storyboarding","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154616844","doi":"https://doi.org/10.48550/arxiv.2604.13452"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.13452","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13452","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.13452","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002257824","display_name":"Ishani Mondal","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mondal, Ishani","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133742557","display_name":"Yiwen Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yiwen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133752119","display_name":"Mihir Parmar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parmar, Mihir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011797382","display_name":"Palash Goyal","orcid":"https://orcid.org/0000-0003-2455-2160"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goyal, Palash","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081307846","display_name":"Jordan Boyd\u2010Graber","orcid":"https://orcid.org/0000-0002-7770-4431"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boyd-Graber, Jordan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133789181","display_name":"Tomas Pfister","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pfister, Tomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100566791","display_name":"Yale Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yale","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5002257824"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.4787999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.4787999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2896000146865845,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.04800000041723251,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.7746999859809875},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5442000031471252},{"id":"https://openalex.org/keywords/storytelling","display_name":"Storytelling","score":0.5275999903678894},{"id":"https://openalex.org/keywords/storyboard","display_name":"Storyboard","score":0.5123999714851379},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.44530001282691956},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.39250001311302185},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.3700000047683716}],"concepts":[{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.7746999859809875},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5846999883651733},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5442000031471252},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.5275999903678894},{"id":"https://openalex.org/C2777080924","wikidata":"https://www.wikidata.org/wiki/Q334667","display_name":"Storyboard","level":2,"score":0.5123999714851379},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.44530001282691956},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41819998621940613},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.39250001311302185},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.3700000047683716},{"id":"https://openalex.org/C2778734905","wikidata":"https://www.wikidata.org/wiki/Q15130689","display_name":"Reinterpretation","level":2,"score":0.3628999888896942},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.3625999987125397},{"id":"https://openalex.org/C2780554381","wikidata":"https://www.wikidata.org/wiki/Q2063340","display_name":"Sensemaking","level":2,"score":0.3614000082015991},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.33149999380111694},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3010999858379364},{"id":"https://openalex.org/C2779754051","wikidata":"https://www.wikidata.org/wiki/Q2903135","display_name":"Interactive storytelling","level":4,"score":0.2800999879837036},{"id":"https://openalex.org/C119657128","wikidata":"https://www.wikidata.org/wiki/Q11633","display_name":"Photography","level":2,"score":0.2793999910354614},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.27390000224113464},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2662000060081482},{"id":"https://openalex.org/C107038049","wikidata":"https://www.wikidata.org/wiki/Q35986","display_name":"Aesthetics","level":1,"score":0.2660999894142151},{"id":"https://openalex.org/C13200473","wikidata":"https://www.wikidata.org/wiki/Q2747831","display_name":"Reflexivity","level":2,"score":0.2630000114440918},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.25760000944137573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.13452","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13452","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.13452","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13452","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.5888200402259827,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Long-form":[0],"visual":[1,57],"storytelling":[2],"requires":[3],"maintaining":[4],"continuity":[5,58,112],"across":[6],"shots,":[7],"including":[8],"consistent":[9],"characters,":[10],"stable":[11],"environments,":[12],"and":[13,38,71,91,93,119],"smooth":[14,76],"scene":[15,40,73],"transitions.":[16],"While":[17],"existing":[18],"generative":[19],"models":[20],"can":[21],"produce":[22],"strong":[23],"individual":[24],"frames,":[25],"they":[26],"fail":[27],"to":[28,33],"preserve":[29],"such":[30],"continuity,":[31,67],"leading":[32],"appearance":[34],"changes,":[35],"inconsistent":[36],"backgrounds,":[37],"abrupt":[39],"shifts.":[41],"We":[42,82],"introduce":[43,94],"CANVAS":[44,62,84,104],"(Continuity-Aware":[45],"Narratives":[46],"via":[47],"Visual":[48],"Agentic":[49],"Storyboarding),":[50],"a":[51,95],"multi-agent":[52],"framework":[53],"that":[54],"explicitly":[55],"plans":[56],"in":[59],"multi-shot":[60],"narratives.":[61],"enforces":[63],"coherence":[64],"through":[65],"character":[66,115],"persistent":[68],"background":[69,111],"anchors,":[70],"location-aware":[72],"planning":[74],"for":[75,100],"transitions":[77],"within":[78],"the":[79,107],"same":[80],"setting":[81],"evaluate":[83],"on":[85],"two":[86],"storyboard":[87],"generation":[88],"benchmarks":[89],"ST-BENCH":[90],"ViStoryBench":[92],"new":[96],"challenging":[97],"benchmark":[98],"HardContinuityBench":[99],"long-range":[101],"narrative":[102],"consistency.":[103],"consistently":[105],"outperforms":[106],"best-performing":[108],"baseline,":[109],"improving":[110],"by":[113,117,122],"21.6%,":[114],"consistency":[116,121],"9.6%":[118],"props":[120],"7.6%.":[123]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-17T00:00:00"}
