{"id":"https://openalex.org/W4415233025","doi":"https://doi.org/10.1109/wacv61042.2026.00626","title":"T2VWorldBench: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation","display_name":"T2VWorldBench: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W4415233025","doi":"https://doi.org/10.1109/wacv61042.2026.00626"},"language":"en","primary_location":{"id":"doi:10.1109/wacv61042.2026.00626","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00626","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.18107","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101542641","display_name":"Yu\u2010Bin Chen","orcid":"https://orcid.org/0000-0002-4302-266X"},"institutions":[{"id":"https://openalex.org/I51504820","display_name":"San Jose State University","ror":"https://ror.org/04qyvz380","country_code":"US","type":"education","lineage":["https://openalex.org/I51504820"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yubin Chen","raw_affiliation_strings":["San Jose State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"San Jose State University","institution_ids":["https://openalex.org/I51504820"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039643783","display_name":"Xuyang Guo","orcid":"https://orcid.org/0000-0002-1826-3082"},"institutions":[{"id":"https://openalex.org/I5343935","display_name":"Guilin University of Electronic Technology","ror":"https://ror.org/05arjae42","country_code":"CN","type":"education","lineage":["https://openalex.org/I5343935"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuyang Guo","raw_affiliation_strings":["Guilin University of Electronic Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Guilin University of Electronic Technology","institution_ids":["https://openalex.org/I5343935"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069272192","display_name":"Zhenmei Shi","orcid":"https://orcid.org/0009-0007-6741-7598"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhenmei Shi","raw_affiliation_strings":["University of Wisconsin-Madison"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Wisconsin-Madison","institution_ids":["https://openalex.org/I135310074"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091070408","display_name":"Zhao Song","orcid":"https://orcid.org/0000-0002-5535-2789"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhao Song","raw_affiliation_strings":["University of California,Berkeley"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California,Berkeley","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069110921","display_name":"Jiahao Zhang","orcid":"https://orcid.org/0000-0002-8066-5496"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiahao Zhang","raw_affiliation_strings":["University of Washington"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Washington","institution_ids":["https://openalex.org/I201448701"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00707778,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"6474","last_page":"6485"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9783999919891357,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9165999889373779,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.8098000288009644},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5676000118255615},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5034999847412109},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.45649999380111694},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.328000009059906}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.8098000288009644},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6880999803543091},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5676000118255615},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.507099986076355},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5034999847412109},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47530001401901245},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.45649999380111694},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4408000111579895},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.29840001463890076},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.28839999437332153},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2741999924182892},{"id":"https://openalex.org/C115925183","wikidata":"https://www.wikidata.org/wiki/Q1412694","display_name":"Knowledge-based systems","level":2,"score":0.2554999887943268},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2551000118255615}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/wacv61042.2026.00626","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00626","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2507.18107","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.18107","pdf_url":"https://arxiv.org/pdf/2507.18107","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2507.18107","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.18107","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.18107","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.18107","pdf_url":"https://arxiv.org/pdf/2507.18107","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Text-to-video":[0],"(T2V)":[1],"models":[2,94,103,117,142,156],"have":[3],"shown":[4],"remarkable":[5],"performance":[6],"in":[7,136,175],"generating":[8],"visually":[9],"reasonable":[10],"scenes,":[11],"while":[12],"their":[13],"capability":[14,138],"to":[15,31,110,120,143],"leverage":[16,144],"world":[17,45,122,145],"knowledge":[18,46,123],"for":[19,42,154,160],"ensuring":[20],"semantic":[21],"consistency":[22],"and":[23,58,73,80,89,113,124,151,163,170],"factual":[24,164],"accuracy":[25],"remains":[26],"largely":[27],"understudied.":[28],"In":[29],"response":[30],"this":[32],"challenge,":[33],"we":[34],"propose":[35],"T2VWorldBench,":[36],"the":[37,44,98,137,167],"first":[38],"systematic":[39],"evaluation":[40,88,91,168],"framework":[41],"evaluating":[43],"generation":[47],"abilities":[48],"of":[49,65,139],"text-to-video":[50,102,141],"models,":[51,112],"covering":[52],"6":[53],"major":[54],"categories,":[55],"60":[56],"subcategories,":[57],"1,200":[59],"prompts":[60,169],"across":[61],"a":[62,133],"wide":[63],"range":[64],"domains,":[66],"including":[67],"physics,":[68],"nature,":[69],"activity,":[70],"culture,":[71],"causality,":[72],"object.":[74],"To":[75],"address":[76],"both":[77,86],"human":[78,87],"preference":[79],"scalable":[81],"evaluation,":[82],"our":[83],"benchmark":[84],"incorporates":[85],"automated":[90],"using":[92],"vision-language":[93],"(VLMs).":[95],"We":[96],"evaluated":[97],"10":[99],"most":[100,116],"advanced":[101],"currently":[104],"available,":[105],"ranging":[106],"from":[107],"open":[108],"source":[109],"commercial":[111],"found":[114,174],"that":[115],"are":[118],"unable":[119],"understand":[121],"generate":[125],"truly":[126],"correct":[127],"videos.":[128],"These":[129],"findings":[130],"point":[131],"out":[132],"critical":[134],"gap":[135],"current":[140],"knowledge,":[146],"providing":[147],"valuable":[148],"research":[149],"opportunities":[150],"entry":[152],"points":[153],"constructing":[155],"with":[157],"robust":[158],"capabilities":[159],"commonsense":[161],"reasoning":[162],"generation.":[165],"All":[166],"code":[171],"can":[172],"be":[173],"https://github.com/magiclinux/world_knowledge.":[176]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-16T00:00:00"}
