{"id":"https://openalex.org/W7162785817","doi":"https://doi.org/10.48550/arxiv.2605.30090","title":"DirectorBench: Diagnosing Long-Form Video Generation with Personalized Multi-Agent Evaluation","display_name":"DirectorBench: Diagnosing Long-Form Video Generation with Personalized Multi-Agent Evaluation","publication_year":2026,"publication_date":"2026-05-28","ids":{"openalex":"https://openalex.org/W7162785817","doi":"https://doi.org/10.48550/arxiv.2605.30090"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.30090","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.30090","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.30090","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137373561","display_name":"Jiamin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011725324","display_name":"Qianben Chen","orcid":"https://orcid.org/0000-0003-2546-0225"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Qianben","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137351288","display_name":"Jiawen Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiawen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101877822","display_name":"Yidi Wu","orcid":"https://orcid.org/0000-0002-9614-1312"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yidi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137324014","display_name":"Yuchen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yuchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137356627","display_name":"Xiaokun Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiaokun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074508950","display_name":"Wangchunshu Zhou","orcid":"https://orcid.org/0000-0003-4668-3348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Wangchunshu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137317928","display_name":"Chen Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.2858999967575073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.2858999967575073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.1679999977350235,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12720","display_name":"Multimedia Communication and Technology","score":0.06750000268220901,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8101999759674072},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7839999794960022},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7465999722480774},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.5827999711036682},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.5425999760627747},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5103999972343445},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4408000111579895}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8264999985694885},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8101999759674072},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7839999794960022},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7465999722480774},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.5827999711036682},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.5425999760627747},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5103999972343445},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4408000111579895},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43779999017715454},{"id":"https://openalex.org/C103910844","wikidata":"https://www.wikidata.org/wiki/Q2631256","display_name":"Video quality","level":3,"score":0.4284999966621399},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.35749998688697815},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33709999918937683},{"id":"https://openalex.org/C201025465","wikidata":"https://www.wikidata.org/wiki/Q11248500","display_name":"User experience design","level":2,"score":0.32420000433921814},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.27790001034736633},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.26409998536109924},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2531000077724457},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25279998779296875},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.30090","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.30090","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.30090","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.30090","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Long-form":[0],"video":[1,65,115,202],"generation":[2,116],"is":[3],"rapidly":[4],"moving":[5],"from":[6],"short,":[7],"single-scene":[8],"synthesis":[9],"toward":[10],"minute-long,":[11],"multi-shot":[12],"creation":[13],"with":[14,71,156],"narrative":[15],"structure,":[16],"cinematic":[17],"control,":[18],"audio,":[19,90],"and":[20,45,52,81,92,107,121,137,165,177,180,197],"cross-modal":[21],"synchronization.":[22],"However,":[23],"evaluating":[24],"such":[25],"videos":[26,70],"remains":[27],"challenging,":[28],"since":[29],"existing":[30],"benchmarks":[31],"largely":[32],"focus":[33],"on":[34],"local":[35],"visual":[36],"quality,":[37],"short-horizon":[38],"temporal":[39],"consistency,":[40],"or":[41],"generic":[42],"prompt":[43],"alignment,":[44],"provide":[46],"limited":[47],"diagnosis":[48],"of":[49,95,195],"workflow":[50],"failures":[51],"user-dependent":[53],"preferences.":[54],"We":[55,111,151],"introduce":[56],"DirectorBench,":[57],"a":[58,99,129],"personalized":[59],"multi-agent":[60],"diagnostic":[61,196],"benchmark":[62],"for":[63,140,200],"long-form":[64,114,201],"generation.":[66,203],"DirectorBench":[67,103,127,164,172],"evaluates":[68],"generated":[69],"respect":[72],"to":[73,98,159],"80":[74],"structured":[75],"metadata":[76],"entries,":[77],"7":[78,122],"user":[79,123,146],"profiles,":[80],"40":[82],"checkpoint":[83],"criteria":[84],"across":[85],"5":[86],"dimensions:":[87],"script,":[88],"visual,":[89],"cross-modal,":[91],"stability.":[93],"Instead":[94],"reducing":[96],"quality":[97,133,175],"single":[100],"aggregate":[101,188],"score,":[102],"localizes":[104],"checkpoint-level":[105],"bottlenecks":[106],"supports":[108],"profile-aware":[109,198],"evaluation.":[110],"evaluate":[112],"4":[113],"workflows,":[117,126],"6":[118],"base":[119],"LLMs,":[120],"profiles.":[124],"Across":[125],"reveals":[128,178],"between-unit":[130],"bottleneck:":[131],"transition":[132],"averages":[134,149],"only":[135],"0.256":[136],"reaches":[138],"0.356":[139],"the":[141,161,193],"best":[142],"workflow,":[143],"while":[144],"prompt-level":[145],"demand":[147],"fulfillment":[148],"0.71.":[150],"further":[152],"conduct":[153],"human":[154,166],"evaluation":[155],"14":[157],"annotators":[158],"validate":[160],"alignment":[162],"between":[163],"judgment.":[167],"The":[168],"results":[169],"show":[170],"that":[171,184],"captures":[173],"human-perceptible":[174],"differences":[176],"workflow-":[179],"profile-dependent":[181],"failure":[182],"modes":[183],"are":[185],"hidden":[186],"by":[187],"scoring.":[189],"These":[190],"findings":[191],"highlight":[192],"importance":[194],"benchmarking":[199]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-30T00:00:00"}
