{"id":"https://openalex.org/W7157576305","doi":"https://doi.org/10.48550/arxiv.2604.24842","title":"Co-Director: Agentic Generative Video Storytelling","display_name":"Co-Director: Agentic Generative Video Storytelling","publication_year":2026,"publication_date":"2026-04-27","ids":{"openalex":"https://openalex.org/W7157576305","doi":"https://doi.org/10.48550/arxiv.2604.24842"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.24842","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24842","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.24842","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100566791","display_name":"Yale Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Song, Yale","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134829953","display_name":"Yiwen Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yiwen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134855444","display_name":"Nick Losier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Losier, Nick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134846304","display_name":"Nathan Hodson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hodson, Nathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134865482","display_name":"Ye Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Ye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134858233","display_name":"Rhyard Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Rhyard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134850377","display_name":"Yan Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Yan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075636031","display_name":"Daniel Vlasic","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vlasic, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134836279","display_name":"Carina Claassen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Claassen, Carina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134828921","display_name":"Jasmine Leon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Leon, Jasmine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134869222","display_name":"Khanh G. LeViet","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"LeViet, Khanh G.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134847453","display_name":"Zack Chomyn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chomyn, Zack","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058120342","display_name":"Joe Timmons","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Timmons, Joe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134842583","display_name":"Brett Slatkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Slatkin, Brett","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015095925","display_name":"Scott Penberthy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Penberthy, Scott","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134855891","display_name":"Tomas Pfister","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pfister, Tomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5100566791"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.36480000615119934,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.36480000615119934,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.19670000672340393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.14300000667572021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/storytelling","display_name":"Storytelling","score":0.7408999800682068},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.6366000175476074},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5674999952316284},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.45089998841285706},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.4316999912261963},{"id":"https://openalex.org/keywords/interactive-storytelling","display_name":"Interactive storytelling","score":0.3864000141620636},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.3212999999523163},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3160000145435333}],"concepts":[{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.7408999800682068},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.732699990272522},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.6366000175476074},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5674999952316284},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.45089998841285706},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.4316999912261963},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.4189999997615814},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39660000801086426},{"id":"https://openalex.org/C2779754051","wikidata":"https://www.wikidata.org/wiki/Q2903135","display_name":"Interactive storytelling","level":4,"score":0.3864000141620636},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3855000138282776},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3212999999523163},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3160000145435333},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.30410000681877136},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.29330000281333923},{"id":"https://openalex.org/C2780554381","wikidata":"https://www.wikidata.org/wiki/Q2063340","display_name":"Sensemaking","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C186886427","wikidata":"https://www.wikidata.org/wiki/Q5441213","display_name":"Feedback loop","level":2,"score":0.26510000228881836},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.24842","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24842","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.24842","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24842","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"diffusion":[1],"models":[2],"generate":[3],"high-fidelity":[4],"video":[5,44],"clips,":[6],"transforming":[7],"them":[8],"into":[9],"coherent":[10],"storytelling":[11,45],"engines":[12],"remains":[13],"challenging.":[14],"Current":[15],"agentic":[16],"pipelines":[17],"automate":[18],"this":[19],"via":[20],"chained":[21],"modules":[22],"but":[23],"suffer":[24],"from":[25],"semantic":[26,53],"drift":[27,75],"and":[28,76],"cascading":[29],"failures":[30],"due":[31],"to":[32,124],"independent,":[33],"handcrafted":[34],"prompting.":[35],"We":[36],"present":[37],"Co-Director,":[38],"a":[39,47,59,68,100,118],"hierarchical":[40,57],"multi-agent":[41],"framework":[42],"formalizing":[43],"as":[46],"global":[48],"optimization":[49],"problem.":[50],"To":[51],"ensure":[52],"coherence,":[54],"we":[55,97],"introduce":[56,98],"parameterization:":[58],"multi-armed":[60],"bandit":[61],"globally":[62],"identifies":[63],"promising":[64],"creative":[65,93],"directions,":[66],"while":[67],"local":[69],"multimodal":[70],"self-refinement":[71],"loop":[72],"mitigates":[73],"identity":[74],"ensures":[77],"sequence-level":[78],"consistency.":[79],"This":[80],"balances":[81],"the":[82,89],"exploration":[83],"of":[84,91,103],"novel":[85],"narrative":[86],"strategies":[87],"with":[88],"exploitation":[90],"effective":[92],"configurations.":[94],"For":[95],"evaluation,":[96],"GenAD-Bench,":[99],"400-scenario":[101],"dataset":[102],"fictional":[104],"products":[105],"for":[106],"personalized":[107],"advertising.":[108],"Experiments":[109],"demonstrate":[110],"that":[111,121],"Co-Director":[112],"significantly":[113],"outperforms":[114],"state-of-the-art":[115],"baselines,":[116],"offering":[117],"principled":[119],"approach":[120],"seamlessly":[122],"generalizes":[123],"broader":[125],"cinematic":[126],"narratives.":[127],"Project":[128],"Page:":[129],"https://co-director-agent.github.io/":[130]},"counts_by_year":[],"updated_date":"2026-04-30T06:11:10.768123","created_date":"2026-04-30T00:00:00"}
