{"id":"https://openalex.org/W4312181536","doi":"https://doi.org/10.1007/s10489-022-04249-x","title":"Modeling opponent learning in multiagent repeated games","display_name":"Modeling opponent learning in multiagent repeated games","publication_year":2022,"publication_date":"2022-12-23","ids":{"openalex":"https://openalex.org/W4312181536","doi":"https://doi.org/10.1007/s10489-022-04249-x"},"language":"en","primary_location":{"id":"doi:10.1007/s10489-022-04249-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10489-022-04249-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10489-022-04249-x.pdf","source":{"id":"https://openalex.org/S74726891","display_name":"Applied Intelligence","issn_l":"0924-669X","issn":["0924-669X","1573-7497"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10489-022-04249-x.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103154700","display_name":"Yudong Hu","orcid":"https://orcid.org/0009-0000-6528-8672"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yudong Hu","raw_affiliation_strings":["School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046469888","display_name":"Congying Han","orcid":"https://orcid.org/0000-0002-3445-4620"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Congying Han","raw_affiliation_strings":["School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100327745","display_name":"Haoran Li","orcid":"https://orcid.org/0000-0003-2559-9585"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoran Li","raw_affiliation_strings":["School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100561359","display_name":"Tiande Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tiande Guo","raw_affiliation_strings":["School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, 100049, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103154700"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.689,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.75715956,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"53","issue":"13","first_page":"17194","last_page":"17210"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stackelberg-competition","display_name":"Stackelberg competition","score":0.8183192014694214},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7796654105186462},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7786543369293213},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.7344023585319519},{"id":"https://openalex.org/keywords/fictitious-play","display_name":"Fictitious play","score":0.6170658469200134},{"id":"https://openalex.org/keywords/dilemma","display_name":"Dilemma","score":0.5729768872261047},{"id":"https://openalex.org/keywords/equilibrium-selection","display_name":"Equilibrium selection","score":0.5221046209335327},{"id":"https://openalex.org/keywords/best-response","display_name":"Best response","score":0.5112786293029785},{"id":"https://openalex.org/keywords/repeated-game","display_name":"Repeated game","score":0.492374062538147},{"id":"https://openalex.org/keywords/adversary","display_name":"Adversary","score":0.48884886503219604},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.4682534635066986},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.44183436036109924},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.43717339634895325},{"id":"https://openalex.org/keywords/equilibrium-point","display_name":"Equilibrium point","score":0.41212689876556396},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3902125954627991},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3260830342769623},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.3169749975204468},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.28902941942214966},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11369764804840088}],"concepts":[{"id":"https://openalex.org/C199510392","wikidata":"https://www.wikidata.org/wiki/Q1184602","display_name":"Stackelberg competition","level":2,"score":0.8183192014694214},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7796654105186462},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7786543369293213},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.7344023585319519},{"id":"https://openalex.org/C145071142","wikidata":"https://www.wikidata.org/wiki/Q1411116","display_name":"Fictitious play","level":3,"score":0.6170658469200134},{"id":"https://openalex.org/C2778496695","wikidata":"https://www.wikidata.org/wiki/Q254128","display_name":"Dilemma","level":2,"score":0.5729768872261047},{"id":"https://openalex.org/C164407509","wikidata":"https://www.wikidata.org/wiki/Q5384490","display_name":"Equilibrium selection","level":4,"score":0.5221046209335327},{"id":"https://openalex.org/C32407928","wikidata":"https://www.wikidata.org/wiki/Q2733833","display_name":"Best response","level":3,"score":0.5112786293029785},{"id":"https://openalex.org/C202556891","wikidata":"https://www.wikidata.org/wiki/Q1584646","display_name":"Repeated game","level":3,"score":0.492374062538147},{"id":"https://openalex.org/C41065033","wikidata":"https://www.wikidata.org/wiki/Q2825412","display_name":"Adversary","level":2,"score":0.48884886503219604},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.4682534635066986},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.44183436036109924},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.43717339634895325},{"id":"https://openalex.org/C94766913","wikidata":"https://www.wikidata.org/wiki/Q1530271","display_name":"Equilibrium point","level":3,"score":0.41212689876556396},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3902125954627991},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3260830342769623},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.3169749975204468},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28902941942214966},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11369764804840088},{"id":"https://openalex.org/C78045399","wikidata":"https://www.wikidata.org/wiki/Q11214","display_name":"Differential equation","level":2,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10489-022-04249-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10489-022-04249-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10489-022-04249-x.pdf","source":{"id":"https://openalex.org/S74726891","display_name":"Applied Intelligence","issn_l":"0924-669X","issn":["0924-669X","1573-7497"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10489-022-04249-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10489-022-04249-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10489-022-04249-x.pdf","source":{"id":"https://openalex.org/S74726891","display_name":"Applied Intelligence","issn_l":"0924-669X","issn":["0924-669X","1573-7497"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1023919524","display_name":null,"funder_award_id":", Grant","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2403571516","display_name":null,"funder_award_id":"11991022","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G262448394","display_name":null,"funder_award_id":"XDA27000000","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5616351183","display_name":null,"funder_award_id":"00000","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5873499025","display_name":null,"funder_award_id":"2021YFA1000403","funder_id":"https://openalex.org/F4320335774","funder_display_name":"Key Technologies Research and Development Program"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G622688436","display_name":null,"funder_award_id":"XDA27000000","funder_id":"https://openalex.org/F4320321133","funder_display_name":"Chinese Academy of Sciences"},{"id":"https://openalex.org/G6258415954","display_name":null,"funder_award_id":"Chinese","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7178638761","display_name":null,"funder_award_id":"100040","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"},{"id":"https://openalex.org/F4320335774","display_name":"Key Technologies Research and Development Program","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312181536.pdf","grobid_xml":"https://content.openalex.org/works/W4312181536.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W1540725368","https://openalex.org/W1981276685","https://openalex.org/W2061017563","https://openalex.org/W2070963703","https://openalex.org/W2093074200","https://openalex.org/W2125293595","https://openalex.org/W2130752181","https://openalex.org/W2142850237","https://openalex.org/W2168405694","https://openalex.org/W2174806087","https://openalex.org/W2292533394","https://openalex.org/W2539402368","https://openalex.org/W2620686495","https://openalex.org/W2768629321","https://openalex.org/W2773381986","https://openalex.org/W2902907165","https://openalex.org/W2965394063","https://openalex.org/W2968866862","https://openalex.org/W2979146916","https://openalex.org/W3035964300","https://openalex.org/W3093657173","https://openalex.org/W3106649810","https://openalex.org/W3119115629","https://openalex.org/W3122483313","https://openalex.org/W3123160622","https://openalex.org/W3212204275","https://openalex.org/W4206500519","https://openalex.org/W4210714139","https://openalex.org/W4210773761"],"related_works":["https://openalex.org/W1935632502","https://openalex.org/W2955291419","https://openalex.org/W2080682057","https://openalex.org/W1984394557","https://openalex.org/W2928289619","https://openalex.org/W2328458106","https://openalex.org/W3136807736","https://openalex.org/W2733656312","https://openalex.org/W3106393350","https://openalex.org/W2050089535"],"abstract_inverted_index":{"Abstract":[0],"Multiagent":[1],"reinforcement":[2,202],"learning":[3,43,51,72,203,211],"(MARL)":[4],"has":[5],"been":[6],"used":[7],"extensively":[8],"in":[9,18,85,91,140,159,167,185,200,213],"the":[10,15,22,25,31,41,70,92,102,110,120,182,196,208],"game":[11,151,187],"environment.":[12],"One":[13],"of":[14,24,94,198,210],"main":[16],"challenges":[17],"MARL":[19,214],"is":[20,28,52],"that":[21,135,179],"environment":[23],"agent":[26],"system":[27],"dynamic,":[29],"and":[30,45,67,74,88,126,152,158,174,205,220],"other":[32],"agents":[33],"are":[34],"also":[35],"updating":[36],"their":[37],"strategies.":[38],"Therefore,":[39],"modeling":[40],"opponents\u2019":[42,121],"process":[44,73],"adopting":[46],"specific":[47],"strategies":[48,87],"to":[49,56,118,176,207,215],"shape":[50],"an":[53],"effective":[54,76],"way":[55],"obtain":[57],"better":[58,138],"training":[59],"results.":[60],"Previous":[61],"studies":[62,80],"such":[63],"as":[64],"DRON,":[65],"LOLA":[66],"SOS":[68],"approximated":[69],"opponent\u2019s":[71],"gave":[75],"applications.":[77],"However,":[78],"these":[79],"modeled":[81],"only":[82],"transient":[83],"changes":[84],"opponent":[86,105],"lacked":[89],"stability":[90],"improvement":[93],"equilibrium":[95,129,184,199,219],"efficiency.":[96,223],"In":[97],"this":[98],"article,":[99],"we":[100],"design":[101,209],"MOL":[103,136,164],"(modeling":[104],"learning)":[106],"method":[107],"based":[108],"on":[109],"Stackelberg":[111,149],"game.":[112],"We":[113,133],"use":[114],"best":[115],"response":[116],"theory":[117],"approximate":[119],"preferences":[122],"for":[123,195],"different":[124,172],"actions":[125],"explore":[127],"stable":[128,177],"with":[130,143,155],"higher":[131],"rewards.":[132],"find":[134],"achieves":[137],"results":[139,190],"several":[141],"games":[142,169],"classical":[144],"structures":[145],"(the":[146],"Prisoner\u2019s":[147],"Dilemma,":[148],"Leader":[150],"Stag":[153],"Hunt":[154],"3":[156],"players),":[157],"randomly":[160],"generated":[161],"bimatrix":[162],"games.":[163],"performs":[165],"well":[166],"competitive":[168],"played":[170],"against":[171],"opponents":[173],"converges":[175],"points":[178],"score":[180],"above":[181],"Nash":[183],"repeated":[186],"environments.":[188],"The":[189],"may":[191],"provide":[192],"a":[193],"reference":[194],"definition":[197],"multiagent":[201],"systems,":[204],"contribute":[206],"objectives":[212],"avoid":[216],"local":[217],"disadvantageous":[218],"improve":[221],"general":[222]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
