{"id":"https://openalex.org/W7140179945","doi":"https://doi.org/10.48550/arxiv.2603.22212","title":"Omni-WorldBench: Towards a Comprehensive Interaction-Centric Evaluation for World Models","display_name":"Omni-WorldBench: Towards a Comprehensive Interaction-Centric Evaluation for World Models","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140179945","doi":"https://doi.org/10.48550/arxiv.2603.22212"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22212","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wu, Meiqi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wu, Meiqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Cai, Zhixin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Zhixin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhao, Fufangchen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Fufangchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Feng, Xiaokun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Xiaokun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Dang, Rujing","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dang, Rujing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Song, Bingze","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Bingze","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Tian, Ruitian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Ruitian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhu, Jiashu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Jiashu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Lei, Jiachen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei, Jiachen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Dou, Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dou, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Tang, Jing","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Jing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Sun, Lei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Lei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wu, Jiahong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Jiahong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Chu, Xiangxiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chu, Xiangxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Zeming","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zeming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Huang, Kaiqi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Kaiqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.5349000096321106,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.5349000096321106,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.13519999384880066,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.060100000351667404,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.6284999847412109},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6036999821662903},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5044999718666077},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4950999915599823},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.46880000829696655},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.40860000252723694},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.3824999928474426}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7041000127792358},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.6284999847412109},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6036999821662903},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5044999718666077},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4950999915599823},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.46299999952316284},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.40860000252723694},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3984000086784363},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3824999928474426},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.36160001158714294},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.33070001006126404},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32420000433921814},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31290000677108765},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3122999966144562},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.29339998960494995},{"id":"https://openalex.org/C2776289891","wikidata":"https://www.wikidata.org/wiki/Q1931511","display_name":"Neglect","level":2,"score":0.2883000075817108},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2883000075817108}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video--based":[0],"world":[1,48,114,144,171,183,205],"models":[2,56,115,172,184],"have":[3],"emerged":[4],"along":[5],"two":[6,121],"dominant":[7],"paradigms:":[8],"video":[9],"generation":[10],"and":[11,24,59,84,133,136,159],"3D":[12,34],"reconstruction.":[13],"However,":[14],"existing":[15,88],"evaluation":[16,140],"benchmarks":[17],"either":[18],"focus":[19],"narrowly":[20],"on":[21,32,155],"visual":[22],"fidelity":[23],"text--video":[25],"alignment":[26],"for":[27,191],"generative":[28],"models,":[29],"or":[30],"rely":[31],"static":[33],"reconstruction":[35],"metrics":[36],"that":[37,44,142],"fundamentally":[38],"neglect":[39],"temporal":[40,60],"dynamics.":[41],"We":[42,164],"argue":[43],"the":[45,65,71,109,149],"future":[46,192],"of":[47,113,152,168,181],"modeling":[49,145],"lies":[50],"in":[51,116,185,202],"4D":[52,117,204],"generation,":[53],"which":[54],"jointly":[55],"spatial":[57],"structure":[58],"evolution.":[61],"In":[62],"this":[63,92,97],"paradigm,":[64],"core":[66],"capability":[67],"is":[68],"interactive":[69,110,186,203],"response:":[70],"ability":[72],"to":[73,107,199],"faithfully":[74],"reflect":[75],"how":[76],"interaction":[77,131,153],"actions":[78,154],"drive":[79],"state":[80,161],"transitions":[81],"across":[82,173],"space":[83],"time.":[85],"Yet":[86],"no":[87],"benchmark":[89,104],"systematically":[90],"evaluates":[91],"critical":[93,179],"dimension.":[94],"To":[95],"address":[96],"gap,":[98],"we":[99],"propose":[100],"Omni--WorldBench,":[101],"a":[102,125],"comprehensive":[103],"specifically":[105],"designed":[106],"evaluate":[108],"response":[111],"capabilities":[112,146],"settings.":[118],"Omni--WorldBench":[119],"comprises":[120],"key":[122],"components:":[123],"Omni--WorldSuite,":[124],"systematic":[126],"prompt":[127],"suite":[128],"spanning":[129],"diverse":[130],"levels":[132],"scene":[134],"types;":[135],"Omni--Metrics,":[137],"an":[138],"agent-based":[139],"framework":[141],"quantifies":[143],"by":[147],"measuring":[148],"causal":[150],"impact":[151],"both":[156],"final":[157],"outcomes":[158],"intermediate":[160],"evolution":[162],"trajectories.":[163],"conduct":[165],"extensive":[166],"evaluations":[167],"18":[169],"representative":[170],"multiple":[174],"paradigms.":[175],"Our":[176],"analysis":[177],"reveals":[178],"limitations":[180],"current":[182],"response,":[187],"providing":[188],"actionable":[189],"insights":[190],"research.":[193],"Omni-WorldBench":[194],"will":[195],"be":[196],"publicly":[197],"released":[198],"foster":[200],"progress":[201],"modeling.":[206]},"counts_by_year":[],"updated_date":"2026-04-25T08:17:42.794288","created_date":"2026-03-25T00:00:00"}
