{"id":"https://openalex.org/W7163006453","doi":"https://doi.org/10.48550/arxiv.2605.31529","title":"SVI-Bench: A Dynamic Microworld for Strategic Video Intelligence","display_name":"SVI-Bench: A Dynamic Microworld for Strategic Video Intelligence","publication_year":2026,"publication_date":"2026-05-29","ids":{"openalex":"https://openalex.org/W7163006453","doi":"https://doi.org/10.48550/arxiv.2605.31529"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.31529","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31529","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.31529","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137518280","display_name":"Yulu Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Yulu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100738287","display_name":"Yi Han","orcid":"https://orcid.org/0000-0001-6847-7559"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi, Han","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137594988","display_name":"Seongsu Ha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ha, Seongsu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101463748","display_name":"Md Mohaiminul Islam","orcid":"https://orcid.org/0000-0003-3338-8614"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Islam, Md Mohaiminul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137554828","display_name":"Benjamin Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082736347","display_name":"Lorenzo Torresani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Torresani, Lorenzo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5081800468","display_name":"Gedas Bertasius","orcid":"https://orcid.org/0000-0003-1800-4790"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bertasius, Gedas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2483000010251999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2483000010251999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1467999964952469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.06949999928474426,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6133000254631042},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5422000288963318},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5364000201225281},{"id":"https://openalex.org/keywords/verisimilitude","display_name":"Verisimilitude","score":0.4471000134944916},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.41019999980926514},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.3750999867916107},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.3529999852180481},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.34380000829696655},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.32190001010894775}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7357000112533569},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6133000254631042},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5468999743461609},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5422000288963318},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5364000201225281},{"id":"https://openalex.org/C2777175534","wikidata":"https://www.wikidata.org/wiki/Q222288","display_name":"Verisimilitude","level":2,"score":0.4471000134944916},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.41019999980926514},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40209999680519104},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37599998712539673},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.3750999867916107},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.3529999852180481},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.34380000829696655},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3407000005245209},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.32190001010894775},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.3206000030040741},{"id":"https://openalex.org/C2778542649","wikidata":"https://www.wikidata.org/wiki/Q4443415","display_name":"Strategic intelligence","level":2,"score":0.3167000114917755},{"id":"https://openalex.org/C3018412434","wikidata":"https://www.wikidata.org/wiki/Q7889","display_name":"Video game","level":2,"score":0.3165000081062317},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.30640000104904175},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.30090001225471497},{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.28790000081062317},{"id":"https://openalex.org/C517642484","wikidata":"https://www.wikidata.org/wiki/Q2388514","display_name":"Intelligence analysis","level":2,"score":0.2824000120162964},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.2809999883174896},{"id":"https://openalex.org/C33009525","wikidata":"https://www.wikidata.org/wiki/Q208841","display_name":"Coevolution","level":2,"score":0.267300009727478},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.266400009393692},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.257999986410141},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.31529","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31529","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.31529","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31529","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.5613837242126465,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"True":[0],"video":[1],"intelligence":[2],"demands":[3],"more":[4],"than":[5],"recognizing":[6],"what":[7,18,26],"is":[8],"visible:":[9],"it":[10],"requires":[11],"reasoning":[12,39],"about":[13],"why":[14],"events":[15],"unfold,":[16],"predicting":[17],"would":[19],"change":[20],"under":[21,108],"different":[22],"conditions,":[23],"and":[24,40,65,117,139,147,183,189,234],"deciding":[25],"to":[27,32,42,231],"do":[28],"next.":[29],"We":[30,165],"refer":[31],"this":[33,54,80],"progression,":[34],"from":[35],"perception":[36],"through":[37],"causal":[38,64],"simulation":[41],"strategic":[43,66],"planning,":[44],"as":[45,92],"Strategic":[46,181],"Video":[47],"Intelligence":[48],"(SVI).":[49],"No":[50],"existing":[51],"benchmark":[52,87],"evaluates":[53],"capability":[55,195],"stack:":[56],"in-the-wild":[57],"videos":[58],"lack":[59],"verifiable":[60],"ground":[61],"truth":[62],"for":[63],"questions,":[67],"while":[68],"synthetic":[69],"environments":[70],"sacrifice":[71],"the":[72,97,112,222],"complexity":[73,98],"of":[74,99,114,125,133,240],"real":[75],"multi-agent":[76,101],"systems.":[77],"To":[78],"bridge":[79],"gap,":[81],"we":[82,192],"introduce":[83],"SVI-Bench,":[84],"a":[85,93,152,161,172,194,238],"large-scale":[86],"that":[88,155],"leverages":[89],"team":[90],"sports":[91],"dynamic":[94],"microworld,":[95],"combining":[96],"real-world":[100],"interaction":[102],"(10-22":[103],"agents":[104],"making":[105],"coordinated":[106],"decisions":[107],"adversarial":[109],"pressure)":[110],"with":[111],"verifiability":[113],"explicit":[115],"rules":[116],"definitive":[118],"outcomes.":[119],"SVI-Bench":[120],"comprises":[121],"approximately":[122,204],"35K":[123],"hours":[124,132],"broadcast":[126],"video,":[127],"15M":[128],"annotated":[129],"actions,":[130],"15K":[131],"expert":[134],"commentary,":[135],"23K":[136],"game":[137,158],"reports,":[138],"103K":[140],"structured":[141],"statistical":[142],"records":[143],"across":[144,237],"basketball,":[145],"soccer,":[146],"hockey,":[148],"all":[149],"constructed":[150],"via":[151],"data":[153,159],"engine":[154],"transforms":[156],"raw":[157],"into":[160,168],"dense,":[162],"cross-referenced":[163],"corpus.":[164],"organize":[166],"evaluation":[167],"9":[169],"tasks":[170,219],"spanning":[171],"progressive":[173],"four-pillar":[174],"hierarchy:":[175],"Dynamic":[176],"Scene":[177],"Understanding,":[178],"Causal":[179],"Reasoning,":[180],"Simulation,":[182],"Agentic":[184,218],"Synthesis.":[185],"Evaluating":[186],"strong":[187],"multimodal":[188],"agentic":[190],"baselines,":[191],"find":[193],"cliff:":[196],"models":[197],"perform":[198],"competently":[199],"on":[200,206],"perceptual":[201],"tasks,":[202],"achieving":[203],"73%":[205],"fine-grained":[207],"action":[208],"QA,":[209],"but":[210],"degrade":[211],"sharply":[212],"at":[213],"each":[214],"successive":[215],"cognitive":[216],"level.":[217],"prove":[220],"hardest:":[221],"strongest":[223],"model":[224],"achieves":[225],"only":[226],"5%":[227],"accuracy":[228],"when":[229],"required":[230],"autonomously":[232],"gather":[233],"integrate":[235],"evidence":[236],"corpus":[239],"1.8M":[241],"clips.":[242]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-06-02T00:00:00"}
