{"id":"https://openalex.org/W7155571331","doi":"https://doi.org/10.48550/arxiv.2604.21686","title":"WorldMark: A Unified Benchmark Suite for Interactive Video World Models","display_name":"WorldMark: A Unified Benchmark Suite for Interactive Video World Models","publication_year":2026,"publication_date":"2026-04-23","ids":{"openalex":"https://openalex.org/W7155571331","doi":"https://doi.org/10.48550/arxiv.2604.21686"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.21686","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21686","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.21686","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134529899","display_name":"Xiaojie Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Xiaojie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134554135","display_name":"Zhengyuan Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Zhengyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134554935","display_name":"Kang He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Kang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134556860","display_name":"Yukang Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Yukang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134492899","display_name":"Xiaofeng Mao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Xiaofeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111026732","display_name":"Yuanyang Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Yuanyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134490110","display_name":"Kaipeng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Kaipeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5078980036","display_name":"Yongtao Ge","orcid":"https://orcid.org/0000-0003-1265-3204"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ge, Yongtao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3172999918460846,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3172999918460846,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.3061999976634979,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.14980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7809000015258789},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.7490000128746033},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6225000023841858},{"id":"https://openalex.org/keywords/stylized-fact","display_name":"Stylized fact","score":0.618399977684021},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5375000238418579},{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.39820000529289246},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.39629998803138733},{"id":"https://openalex.org/keywords/test-suite","display_name":"Test suite","score":0.3801000118255615}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7809000015258789},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.7490000128746033},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7487000226974487},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6225000023841858},{"id":"https://openalex.org/C38935604","wikidata":"https://www.wikidata.org/wiki/Q4330363","display_name":"Stylized fact","level":2,"score":0.618399977684021},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5375000238418579},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.39820000529289246},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.39629998803138733},{"id":"https://openalex.org/C151552104","wikidata":"https://www.wikidata.org/wiki/Q7705809","display_name":"Test suite","level":4,"score":0.3801000118255615},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3718999922275543},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3506999909877777},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.34769999980926514},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.33390000462532043},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.32170000672340393},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.3147999942302704},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.31470000743865967},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30239999294281006},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.2939999997615814},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2809999883174896},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2574000060558319},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.25290000438690186},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.21686","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21686","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.21686","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21686","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Interactive":[0],"video":[1],"generation":[2],"models":[3,74,122,221],"such":[4,39,86],"as":[5,40,185],"Genie,":[6],"YUME,":[7],"HY-World,":[8],"and":[9,26,45,61,126,139,143,146,156,167,196,228],"Matrix-Game":[10],"are":[11],"advancing":[12],"rapidly,":[13],"yet":[14],"every":[15],"model":[16,197],"is":[17],"evaluated":[18],"on":[19,123],"its":[20],"own":[21,183],"benchmark":[22,83],"with":[23,75],"private":[24],"scenes":[25,125],"trajectories,":[27],"making":[28],"fair":[29],"cross-model":[30],"comparison":[31,118],"impossible.":[32],"Existing":[33],"public":[34],"benchmarks":[35],"offer":[36],"useful":[37],"metrics":[38,71,184],"trajectory":[41],"error,":[42],"aesthetic":[43],"scores,":[44],"VLM-based":[46],"judgments,":[47],"but":[48],"none":[49],"supplies":[50],"the":[51,81,186,230],"standardized":[52,177],"test":[53,131],"conditions":[54],"--":[55,66],"identical":[56,58,124],"scenes,":[57,145],"action":[59,108],"sequences,":[60],"a":[62,87,99,105,129,158],"unified":[63,100],"control":[64,114],"interface":[65],"needed":[67],"to":[68,152,199],"make":[69],"those":[70],"comparable":[72],"across":[73,119],"heterogeneous":[76],"inputs.":[77],"We":[78,189],"introduce":[79],"WorldMark,":[80],"first":[82],"that":[84,103,172],"provides":[85],"common":[88],"playing":[89],"field":[90,187],"for":[91,162],"interactive":[92],"Image-to-Video":[93],"world":[94,220],"models.":[95],"WorldMark":[96],"contributes:":[97],"(1)":[98],"action-mapping":[101],"layer":[102],"translates":[104],"shared":[106],"WASD-style":[107],"vocabulary":[109],"into":[110],"each":[111,223],"model's":[112],"native":[113],"format,":[115],"enabling":[116],"apples-to-apples":[117],"six":[120],"major":[121],"trajectories;":[127],"(2)":[128],"hierarchical":[130],"suite":[132],"of":[133],"500":[134],"evaluation":[135,160,194],"cases":[136],"covering":[137],"first-":[138],"third-person":[140],"viewpoints,":[141],"photorealistic":[142],"stylized":[144],"three":[147],"difficulty":[148],"tiers":[149],"from":[150],"Easy":[151],"Hard":[153],"spanning":[154],"20-60s;":[155],"(3)":[157],"modular":[159],"toolkit":[161],"Visual":[163],"Quality,":[164],"Control":[165],"Alignment,":[166],"World":[168,208],"Consistency,":[169],"designed":[170],"so":[171],"researchers":[173],"can":[174,217],"reuse":[175],"our":[176],"inputs":[178],"while":[179],"plugging":[180],"in":[181,225],"their":[182],"evolves.":[188],"will":[190],"release":[191],"all":[192],"data,":[193],"code,":[195],"outputs":[198],"facilitate":[200],"future":[201],"research.":[202],"Beyond":[203],"offline":[204],"metrics,":[205],"we":[206],"launch":[207],"Model":[209],"Arena":[210],"(warena.ai),":[211],"an":[212],"online":[213],"platform":[214],"where":[215],"anyone":[216],"pit":[218],"leading":[219],"against":[222],"other":[224],"side-by-side":[226],"battles":[227],"watch":[229],"live":[231],"leaderboard.":[232]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-25T00:00:00"}
