{"id":"https://openalex.org/W4405304327","doi":"https://doi.org/10.1109/tnnls.2024.3457509","title":"Purified Policy Space Response Oracles for Symmetric Zero-Sum Games","display_name":"Purified Policy Space Response Oracles for Symmetric Zero-Sum Games","publication_year":2024,"publication_date":"2024-12-12","ids":{"openalex":"https://openalex.org/W4405304327","doi":"https://doi.org/10.1109/tnnls.2024.3457509","pmid":"https://pubmed.ncbi.nlm.nih.gov/40030521"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2024.3457509","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3457509","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072366496","display_name":"Zhengdao Shao","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhengdao Shao","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044163181","display_name":"Liansheng Zhuang","orcid":"https://orcid.org/0000-0002-4345-856X"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liansheng Zhuang","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073135795","display_name":"Yihong Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yihong Huang","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078141810","display_name":"Houqiang Li","orcid":"https://orcid.org/0000-0003-2188-3028"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Houqiang Li","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China (USTC), Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041312010","display_name":"Shafei Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shafei Wang","raw_affiliation_strings":["Pengcheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Pengcheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5072366496"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.4907,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.72062262,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"36","issue":"6","first_page":"11258","last_page":"11270"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9172999858856201,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9172999858856201,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10927","display_name":"Access Control and Trust","score":0.9111999869346619,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.6505255699157715},{"id":"https://openalex.org/keywords/zero-sum-game","display_name":"Zero-sum game","score":0.5734665989875793},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.49409177899360657},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4678574204444885},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.4145326614379883},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3934248685836792},{"id":"https://openalex.org/keywords/pure-mathematics","display_name":"Pure mathematics","score":0.35903775691986084},{"id":"https://openalex.org/keywords/algebra-over-a-field","display_name":"Algebra over a field","score":0.3292461931705475},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.32090193033218384},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.2979964017868042},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.17624735832214355},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.08990654349327087},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.059488147497177124}],"concepts":[{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.6505255699157715},{"id":"https://openalex.org/C136356330","wikidata":"https://www.wikidata.org/wiki/Q156612","display_name":"Zero-sum game","level":3,"score":0.5734665989875793},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.49409177899360657},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4678574204444885},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.4145326614379883},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3934248685836792},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.35903775691986084},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.3292461931705475},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.32090193033218384},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.2979964017868042},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.17624735832214355},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.08990654349327087},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.059488147497177124},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2024.3457509","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3457509","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:40030521","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40030521","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Climate action","id":"https://metadata.un.org/sdg/13"}],"awards":[{"id":"https://openalex.org/G2203821447","display_name":null,"funder_award_id":"U20B2070","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3146671063","display_name":null,"funder_award_id":"61976199","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1675187506","https://openalex.org/W1991624978","https://openalex.org/W2124191651","https://openalex.org/W2130406232","https://openalex.org/W2167957526","https://openalex.org/W2168281471","https://openalex.org/W2810602713","https://openalex.org/W2960876848","https://openalex.org/W2964381205","https://openalex.org/W2976996772","https://openalex.org/W2982316857","https://openalex.org/W3015082424","https://openalex.org/W3016722131","https://openalex.org/W3110979110","https://openalex.org/W4297964528","https://openalex.org/W4310705874","https://openalex.org/W4322706754","https://openalex.org/W4385194705","https://openalex.org/W4385565498","https://openalex.org/W4389170216","https://openalex.org/W4392405470","https://openalex.org/W4392903915","https://openalex.org/W4401023795","https://openalex.org/W6637967152","https://openalex.org/W6676957253","https://openalex.org/W6681187623","https://openalex.org/W6685659016","https://openalex.org/W6696772115","https://openalex.org/W6735641298","https://openalex.org/W6743367460","https://openalex.org/W6746177919","https://openalex.org/W6755963907","https://openalex.org/W6758729514","https://openalex.org/W6771904302","https://openalex.org/W6772005887","https://openalex.org/W6775289199","https://openalex.org/W6775695405","https://openalex.org/W6776645179","https://openalex.org/W6780162350","https://openalex.org/W6780812528","https://openalex.org/W6788109975","https://openalex.org/W6796742507","https://openalex.org/W6797070888","https://openalex.org/W6803852615","https://openalex.org/W6810580173","https://openalex.org/W6852774576","https://openalex.org/W6854295251"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W3013650182","https://openalex.org/W2989283631","https://openalex.org/W2739681863","https://openalex.org/W3170723600","https://openalex.org/W4287122294","https://openalex.org/W2039187327","https://openalex.org/W4307291161","https://openalex.org/W1877069894","https://openalex.org/W1994737592"],"abstract_inverted_index":{"Policy":[0],"space":[1],"response":[2,114],"oracles":[3],"(PSRO)":[4],"is":[5,117],"a":[6,17,28,33,52,96,121,212],"promising":[7],"tool":[8],"to":[9,119,128,172],"find":[10],"an":[11,168],"approximate":[12,40,106],"Nash":[13],"equilibrium":[14,24],"(NE)":[15],"in":[16],"two-player":[18],"zero-sum":[19],"game.":[20],"It":[21],"solves":[22],"the":[23,44,65,70,130,144,147,153,160,178,182,185],"by":[25,32,101],"iteratively":[26],"expanding":[27],"small-scale":[29],"meta-game":[30],"formed":[31,100],"restricted":[34],"strategy":[35,71,98,103,123,131,148],"population":[36,99,132],"consisting":[37],"of":[38,43,69,105,146,155,162,181,194],"historical":[39],"best":[41,49,107],"responses":[42,50],"meta-games.":[45],"However,":[46],"since":[47],"these":[48],"have":[51,64],"strong":[53],"correlation":[54],"with":[55,125,211],"each":[56,134],"other,":[57],"existing":[58,207],"PSRO":[59,140,203],"and":[60,73,80,176,197],"its":[61],"variants":[62],"often":[63],"slow":[66,81],"diversity":[67,145],"growth":[68],"population,":[72,149],"thus":[74,150],"suffer":[75],"from":[76],"poor":[77],"exploration":[78],"efficiency":[79,154],"convergence":[82,161],"rate.":[83],"To":[84],"address":[85],"this":[86,88,137],"problem,":[87],"article":[89],"proposes":[90],"Purified":[91,139,163,202],"PSRO,":[92],"which":[93],"deliberately":[94],"maintains":[95],"pure":[97,102,122],"bases":[104],"responses.":[108],"A":[109],"novel":[110],"module":[111,171],"namely":[112],"non-best":[113],"suppression":[115],"(NBRS)":[116],"introduced":[118],"calculate":[120],"base":[124],"better":[126],"orthogonality":[127],"expand":[129],"at":[133],"epoch.":[135],"In":[136],"way,":[138],"can":[141,204],"quickly":[142],"increase":[143],"greatly":[151],"enhance":[152],"exploration.":[156],"Theoretically,":[157],"we":[158,166],"prove":[159],"PSRO.":[164],"Moreover,":[165],"introduce":[167],"early":[169],"stop":[170],"reduce":[173],"computation":[174],"cost,":[175],"give":[177],"upper":[179],"bound":[180],"exploitability":[183],"when":[184],"algorithm":[186],"stops":[187],"early.":[188],"Extensive":[189],"experiments":[190],"on":[191],"random":[192],"games":[193],"skill":[195],"(RGoS)":[196],"real-world":[198],"meta-games":[199],"show":[200],"that":[201],"consistently":[205],"outperform":[206],"SOTA":[208],"methods,":[209],"sometimes":[210],"large":[213],"margin.":[214]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
