{"id":"https://openalex.org/W4404308559","doi":"https://doi.org/10.48550/arxiv.2410.18072","title":"WorldSimBench: Towards Video Generation Models as World Simulators","display_name":"WorldSimBench: Towards Video Generation Models as World Simulators","publication_year":2024,"publication_date":"2024-10-23","ids":{"openalex":"https://openalex.org/W4404308559","doi":"https://doi.org/10.48550/arxiv.2410.18072"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2410.18072","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.18072","pdf_url":"https://arxiv.org/pdf/2410.18072","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2410.18072","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113116658","display_name":"Yiran Qin","orcid":"https://orcid.org/0009-0008-4561-0685"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Qin, Yiran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031242463","display_name":"Zhelun Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Zhelun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112281651","display_name":"Jiwen Yu","orcid":"https://orcid.org/0000-0001-8577-183X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Jiwen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100709594","display_name":"Xijun Wang","orcid":"https://orcid.org/0000-0002-0949-3492"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xijun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102521317","display_name":"Enshen Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Enshen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100376791","display_name":"Lijun Li","orcid":"https://orcid.org/0000-0002-8760-3722"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Lijun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063953932","display_name":"Zhenfei Yin","orcid":"https://orcid.org/0000-0002-8666-1103"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Zhenfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027234036","display_name":"Xihui Liu","orcid":"https://orcid.org/0000-0002-1791-8745"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xihui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054666319","display_name":"Sheng Lu","orcid":"https://orcid.org/0000-0001-7532-8981"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheng, Lu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102006926","display_name":"Jing Shao","orcid":"https://orcid.org/0000-0002-2500-2366"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Jing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014537649","display_name":"Lei Bai","orcid":"https://orcid.org/0000-0001-8968-3386"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087818121","display_name":"Wanli Ouyang","orcid":"https://orcid.org/0000-0002-9163-2761"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ouyang, Wanli","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003608795","display_name":"Ruimao Zhang","orcid":"https://orcid.org/0000-0001-9511-7532"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ruimao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5113116658"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12698","display_name":"3D Modeling in Geospatial Applications","score":0.585099995136261,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12698","display_name":"3D Modeling in Geospatial Applications","score":0.585099995136261,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11195","display_name":"Simulation Techniques and Applications","score":0.5478000044822693,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.4975000023841858,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47787562012672424},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.43682777881622314}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47787562012672424},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.43682777881622314}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2410.18072","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.18072","pdf_url":"https://arxiv.org/pdf/2410.18072","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:hub.hku.hk:10722/359198","is_oa":false,"landing_page_url":"https://hub.hku.hk/handle/10722/359198","pdf_url":null,"source":{"id":"https://openalex.org/S4377196271","display_name":"The HKU Scholars Hub (University of Hong Kong)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I889458895","host_organization_name":"University of Hong Kong","host_organization_lineage":["https://openalex.org/I889458895"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference_Paper"},{"id":"doi:10.48550/arxiv.2410.18072","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2410.18072","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2410.18072","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.18072","pdf_url":"https://arxiv.org/pdf/2410.18072","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Recent":[0],"advancements":[1],"in":[2,9,71,103,190,204],"predictive":[3,33,47,61],"models":[4,48,62],"have":[5],"demonstrated":[6],"exceptional":[7],"capabilities":[8],"predicting":[10],"the":[11,19,30,58,68,97,120,126,155,162,168,177,186],"future":[12],"state":[13],"of":[14,21,32,60,158,171],"objects":[15],"and":[16,66,88,100,116,152],"scenes.":[17],"However,":[18],"lack":[20],"categorization":[22],"based":[23,133],"on":[24,134],"inherent":[25],"characteristics":[26],"continues":[27],"to":[28,41,141],"hinder":[29],"progress":[31],"model":[34],"development.":[35],"Additionally,":[36],"existing":[37],"benchmarks":[38],"are":[39],"unable":[40],"effectively":[42],"evaluate":[43],"higher-capability,":[44],"highly":[45],"embodied":[46,51,104,109,216],"from":[49,96],"an":[50],"perspective.":[52],"In":[53,119,161],"this":[54],"work,":[55],"we":[56,124,139,166],"classify":[57],"functionalities":[59],"into":[63,185],"a":[64,77,129,143,212],"hierarchy":[65],"take":[67],"first":[69],"step":[70],"evaluating":[72,175],"World":[73,159,172,209],"Simulators":[74,173,210],"by":[75,174],"proposing":[76],"dual":[78],"evaluation":[79,195],"framework":[80],"called":[81],"WorldSimBench.":[82],"WorldSimBench":[83],"includes":[84],"Explicit":[85,121],"Perceptual":[86,122],"Evaluation":[87],"Implicit":[89,163],"Manipulative":[90,164],"Evaluation,":[91,123,165],"encompassing":[92],"human":[93,136,150],"preference":[94],"assessments":[95],"visual":[98,156],"perspective":[99],"action-level":[101],"evaluations":[102],"tasks,":[105],"covering":[106],"three":[107],"representative":[108],"scenarios:":[110],"Open-Ended":[111],"Embodied":[112],"Environment,":[113],"Autonomous,":[114],"Driving,":[115],"Robot":[117],"Manipulation.":[118],"introduce":[125],"HF-Embodied":[127],"Dataset,":[128],"video":[130,180,205],"assessment":[131],"dataset":[132],"fine-grained":[135],"feedback,":[137],"which":[138],"use":[140],"train":[142],"Human":[144],"Preference":[145],"Evaluator":[146],"that":[147,199],"aligns":[148],"with":[149],"perception":[151],"explicitly":[153],"assesses":[154],"fidelity":[157],"Simulators.":[160],"assess":[167],"video-action":[169],"consistency":[170],"whether":[176],"generated":[178],"situation-aware":[179],"can":[181,200],"be":[182],"accurately":[183],"translated":[184],"correct":[187],"control":[188],"signals":[189],"dynamic":[191],"environments.":[192],"Our":[193],"comprehensive":[194],"offers":[196],"key":[197],"insights":[198],"drive":[201],"further":[202],"innovation":[203],"generation":[206],"models,":[207],"positioning":[208],"as":[211],"pivotal":[213],"advancement":[214],"toward":[215],"artificial":[217],"intelligence.":[218]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
