{"id":"https://openalex.org/W7134965896","doi":"https://doi.org/10.48550/arxiv.2603.09337","title":"Beyond Scaling: Assessing Strategic Reasoning and Rapid Decision-Making Capability of LLMs in Zero-sum Environments","display_name":"Beyond Scaling: Assessing Strategic Reasoning and Rapid Decision-Making Capability of LLMs in Zero-sum Environments","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134965896","doi":"https://doi.org/10.48550/arxiv.2603.09337"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09337","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128792903","display_name":"Yang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128750748","display_name":"Xing Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Xing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128711429","display_name":"Yutao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yutao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017490346","display_name":"Gege Qi","orcid":"https://orcid.org/0000-0002-0032-6786"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Gege","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101353649","display_name":"Yanxian Bi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"BI, Yanxian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128789349","display_name":"Zizhe Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zizhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128710409","display_name":"Yunjian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yunjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128745851","display_name":"Yao Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Yao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.3555999994277954,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.3555999994277954,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1468999981880188,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.065700002014637,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/strategic-planning","display_name":"Strategic planning","score":0.5041999816894531},{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.42719998955726624},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.4034000039100647},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.3984000086784363},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.39320001006126404},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.366100013256073},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.33739998936653137}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6786999702453613},{"id":"https://openalex.org/C48243021","wikidata":"https://www.wikidata.org/wiki/Q932522","display_name":"Strategic planning","level":2,"score":0.5041999816894531},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.42719998955726624},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.4034000039100647},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.3984000086784363},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.39320001006126404},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.366100013256073},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35040000081062317},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.33739998936653137},{"id":"https://openalex.org/C152563557","wikidata":"https://www.wikidata.org/wiki/Q7621861","display_name":"Strategic thinking","level":3,"score":0.3337000012397766},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.32989999651908875},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.3095000088214874},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.30059999227523804},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.28839999437332153},{"id":"https://openalex.org/C181622380","wikidata":"https://www.wikidata.org/wiki/Q26911","display_name":"Profit (economics)","level":2,"score":0.2768000066280365},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C103423482","wikidata":"https://www.wikidata.org/wiki/Q552515","display_name":"Competitive intelligence","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2567000091075897},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.2565999925136566},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.25619998574256897},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.25519999861717224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.6639812588691711}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"achieved":[5],"strong":[6],"performance":[7,173],"on":[8,99,194,199],"static":[9],"reasoning":[10,30,69,195],"benchmarks,":[11],"yet":[12],"their":[13,166],"effectiveness":[14],"as":[15,31,70,146,210],"interactive":[16,189],"agents":[17],"operating":[18],"in":[19,174,188,218],"adversarial,":[20],"time-sensitive":[21],"environments":[22,190],"remains":[23],"poorly":[24],"understood.":[25],"Existing":[26],"evaluations":[27,154],"largely":[28],"treat":[29],"a":[32,56,95,100,104,128,156,211],"single-shot":[33],"capability,":[34],"overlooking":[35],"the":[36,140,200],"challenges":[37],"of":[38,86,142],"opponent-aware":[39],"decision-making,":[40],"temporal":[41],"constraints,":[42],"and":[43,80,90,107,116,149],"execution":[44,93,110,147],"under":[45],"pressure.":[46],"This":[47],"paper":[48],"introduces":[49],"Strategic":[50,129],"Tactical":[51],"Agent":[52],"Reasoning":[53],"(STAR)":[54],"Benchmark,":[55],"multi-agent":[57],"evaluation":[58,115],"framework":[59],"that":[60,132,185],"assesses":[61,133],"LLMs":[62],"through":[63],"1v1":[64],"zero-sum":[65],"competitive":[66,136],"interactions,":[67],"framing":[68],"an":[71],"iterative,":[72],"adaptive":[73],"decision-making":[74],"process.":[75],"STAR":[76,112,209],"supports":[77],"both":[78],"turn-based":[79,164],"real-time":[81,175],"settings,":[82,165],"enabling":[83],"controlled":[84],"analysis":[85],"long-horizon":[87],"strategic":[88,143,186],"planning":[89],"fast-paced":[91],"tactical":[92],"within":[94],"unified":[96],"environment.":[97],"Built":[98],"modular":[101],"architecture":[102],"with":[103],"standardized":[105],"API":[106],"fully":[108],"implemented":[109],"engine,":[111],"facilitates":[113],"reproducible":[114],"flexible":[117],"task":[118],"customization.":[119],"To":[120],"move":[121],"beyond":[122],"binary":[123],"win-loss":[124],"outcomes,":[125],"we":[126],"introduce":[127],"Evaluation":[130],"Suite":[131],"not":[134,192],"only":[135,193],"success":[137],"but":[138,197],"also":[139,198],"quality":[141],"behavior,":[144],"such":[145],"efficiency":[148],"outcome":[150],"stability.":[151],"Extensive":[152],"pairwise":[153],"reveal":[155],"pronounced":[157],"strategy-execution":[158],"gap:":[159],"while":[160],"reasoning-intensive":[161],"models":[162,180],"dominate":[163],"inference":[167],"latency":[168],"often":[169],"leads":[170],"to":[171,202],"inferior":[172],"scenarios,":[176],"where":[177],"faster":[178],"instruction-tuned":[179],"prevail.":[181],"These":[182],"results":[183],"show":[184],"intelligence":[187],"depends":[191],"depth,":[196],"ability":[201],"translate":[203],"plans":[204],"into":[205],"timely":[206],"actions,":[207],"positioning":[208],"principled":[212],"benchmark":[213],"for":[214],"studying":[215],"this":[216],"trade-off":[217],"competitive,":[219],"dynamic":[220],"settings.":[221]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-12T00:00:00"}
