{"id":"https://openalex.org/W4409225579","doi":"https://doi.org/10.1109/tnnls.2025.3550827","title":"Distributed Policy Space Response Oracles in Two-Player Zero-Sum Games","display_name":"Distributed Policy Space Response Oracles in Two-Player Zero-Sum Games","publication_year":2025,"publication_date":"2025-04-07","ids":{"openalex":"https://openalex.org/W4409225579","doi":"https://doi.org/10.1109/tnnls.2025.3550827","pmid":"https://pubmed.ncbi.nlm.nih.gov/40193259"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2025.3550827","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2025.3550827","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077477958","display_name":"Hongsong Tang","orcid":"https://orcid.org/0000-0002-1366-3749"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongsong Tang","raw_affiliation_strings":["School of Science, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Science, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111492686","display_name":"Yingzhuo Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingzhuo Liu","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021357065","display_name":"Lionel M. Ni","orcid":"https://orcid.org/0000-0002-2325-6215"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Letian Ni","raw_affiliation_strings":["School of Science, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Science, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077408167","display_name":"Liuyu Xiang","orcid":"https://orcid.org/0000-0001-8486-6255"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liuyu Xiang","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090073634","display_name":"Yaodong Yang","orcid":"https://orcid.org/0000-0001-8132-5613"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaodong Yang","raw_affiliation_strings":["Institute for Artificial Intelligence, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute for Artificial Intelligence, Peking University, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061290890","display_name":"Ke Bi","orcid":"https://orcid.org/0000-0002-3357-5754"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Bi","raw_affiliation_strings":["School of Science, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Science, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057318866","display_name":"Zhaofeng He","orcid":"https://orcid.org/0000-0002-3433-8435"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaofeng He","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5077477958"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08724798,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"36","issue":"6","first_page":"9893","last_page":"9904"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10927","display_name":"Access Control and Trust","score":0.9264000058174133,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10927","display_name":"Access Control and Trust","score":0.9264000058174133,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.7220908999443054},{"id":"https://openalex.org/keywords/zero-sum-game","display_name":"Zero-sum game","score":0.6370576620101929},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5485292077064514},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.45489567518234253},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4489143490791321},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.4009222984313965},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.3276323676109314},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.32682764530181885},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.2871226668357849},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0552082359790802}],"concepts":[{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.7220908999443054},{"id":"https://openalex.org/C136356330","wikidata":"https://www.wikidata.org/wiki/Q156612","display_name":"Zero-sum game","level":3,"score":0.6370576620101929},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5485292077064514},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.45489567518234253},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4489143490791321},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.4009222984313965},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.3276323676109314},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.32682764530181885},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.2871226668357849},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0552082359790802},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2025.3550827","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2025.3550827","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:40193259","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40193259","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","score":0.44999998807907104,"display_name":"Climate action"}],"awards":[{"id":"https://openalex.org/G2115728724","display_name":null,"funder_award_id":"JQ22010","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"},{"id":"https://openalex.org/G2805850703","display_name":null,"funder_award_id":"62206012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4800139155","display_name":null,"funder_award_id":"62301066","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6278709589","display_name":null,"funder_award_id":"U2241243","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8361507201","display_name":null,"funder_award_id":"62176025","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G858523971","display_name":null,"funder_award_id":"2023RC72","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G8709529125","display_name":null,"funder_award_id":"U21B2045","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W2295179707","https://openalex.org/W2617547828","https://openalex.org/W2982316857","https://openalex.org/W3096726323","https://openalex.org/W4286748781","https://openalex.org/W4296546847","https://openalex.org/W4297964528","https://openalex.org/W4401023795","https://openalex.org/W4405304327","https://openalex.org/W6604092932","https://openalex.org/W6676957253","https://openalex.org/W6741002519","https://openalex.org/W6743367460","https://openalex.org/W6744537943","https://openalex.org/W6746177919","https://openalex.org/W6748554570","https://openalex.org/W6748638692","https://openalex.org/W6748672522","https://openalex.org/W6758729514","https://openalex.org/W6769580333","https://openalex.org/W6771312369","https://openalex.org/W6773329755","https://openalex.org/W6775695405","https://openalex.org/W6780812528","https://openalex.org/W6785535465","https://openalex.org/W6789083056","https://openalex.org/W6790900645","https://openalex.org/W6791661883","https://openalex.org/W6797070888","https://openalex.org/W6799873116","https://openalex.org/W6800877681","https://openalex.org/W6803116530","https://openalex.org/W6803644465","https://openalex.org/W6810580173","https://openalex.org/W6850383713","https://openalex.org/W6854295251","https://openalex.org/W6868817401","https://openalex.org/W6871666476","https://openalex.org/W6874788513"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W3013650182","https://openalex.org/W2739681863","https://openalex.org/W3170723600","https://openalex.org/W4287122294","https://openalex.org/W2039187327","https://openalex.org/W4307291161","https://openalex.org/W1877069894","https://openalex.org/W1994737592","https://openalex.org/W2092048262"],"abstract_inverted_index":{"Policy":[0],"space":[1],"response":[2],"oracle":[3],"(PSRO)":[4],"is":[5,26,48],"a":[6,175,207],"population-based":[7],"algorithm":[8],"that":[9],"can":[10],"be":[11],"used":[12],"to":[13,74,135,181],"solve":[14,76],"two-player":[15],"zero-sum":[16],"games.":[17],"In":[18,42,67],"the":[19,34,97,100,131,141,155,183,186,193,198,203],"PSRO":[20,59,73],"solution":[21],"framework,":[22],"optimizing":[23],"policy":[24,101],"diversity":[25,82,137,145],"crucial":[27],"for":[28],"addressing":[29],"nontransitive":[30,176],"game":[31,54,78],"problems,":[32],"helping":[33],"agent":[35],"population":[36],"avoid":[37],"exploitation":[38],"by":[39,120,163],"unfamiliar":[40],"opponents.":[41],"addition,":[43],"while":[44,83],"deep":[45],"reinforcement":[46],"learning":[47],"highly":[49],"effective":[50,65,113],"in":[51,64,206],"solving":[52],"complex":[53,77],"environments,":[55],"its":[56],"integration":[57],"with":[58,123],"remains":[60],"fragmented":[61],"and":[62,95,179,195,202],"lacking":[63],"coordination.":[66],"this":[68],"study,":[69],"we":[70,87,153,191],"propose":[71],"distributed":[72,125,132,199],"efficiently":[75],"scenarios.":[79],"To":[80],"enhance":[81],"managing":[84],"optimization":[85,146],"costs,":[86],"introduce":[88,154],"TOP-K":[89,187],"truncation,":[90],"which":[91,160],"prioritizes":[92],"high-quality":[93],"opponents":[94],"limits":[96],"size":[98],"of":[99,185,197],"pool":[102],"during":[103,167],"sampling.":[104,169],"This":[105],"approach":[106,205],"not":[107],"only":[108],"reduces":[109],"interference":[110],"from":[111],"less":[112],"strategies":[114],"but":[115],"also":[116,129],"ensures":[117],"computational":[118,150],"efficiency":[119,196],"seamlessly":[121],"integrating":[122],"our":[124],"training":[126,133,200],"framework.":[127],"We":[128,170],"design":[130],"framework":[134,201],"incorporate":[136],"estimation":[138],"directly":[139],"into":[140],"sampling":[142],"process,":[143],"achieving":[144],"without":[147],"incurring":[148],"additional":[149],"overhead.":[151],"Furthermore,":[152],"opponent":[156,165],"first":[157],"(OF)":[158],"method,":[159],"enhances":[161],"decision-making":[162],"leveraging":[164],"information":[166],"interaction":[168],"perform":[171],"experimental":[172],"validation":[173],"using":[174],"mixture":[177],"model":[178],"AlphaStar888":[180],"confirm":[182],"effectiveness":[184],"truncation":[188],"approach.":[189],"Finally,":[190],"demonstrate":[192],"feasibility":[194],"OF":[204],"Google":[208],"Research":[209],"Football":[210],"11":[211,213],"versus":[212],"scenario.":[214]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
