{"id":"https://openalex.org/W4390939369","doi":"https://doi.org/10.1109/tcns.2024.3355035","title":"Payoff-Based Learning of Nash Equilibria in Merely Monotone Games","display_name":"Payoff-Based Learning of Nash Equilibria in Merely Monotone Games","publication_year":2024,"publication_date":"2024-01-17","ids":{"openalex":"https://openalex.org/W4390939369","doi":"https://doi.org/10.1109/tcns.2024.3355035"},"language":"en","primary_location":{"id":"doi:10.1109/tcns.2024.3355035","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcns.2024.3355035","pdf_url":null,"source":{"id":"https://openalex.org/S2502544478","display_name":"IEEE Transactions on Control of Network Systems","issn_l":"2325-5870","issn":["2325-5870","2372-2533"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control of Network Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://infoscience.epfl.ch/handle/20.500.14299/242395","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042936048","display_name":"Tatiana Tatarenko","orcid":"https://orcid.org/0000-0001-8951-112X"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tatiana Tatarenko","raw_affiliation_strings":["Department of Control Theory and Robotics, TU Darmstadt, Darmstadt, Germany"],"raw_orcid":"https://orcid.org/0000-0001-8951-112X","affiliations":[{"raw_affiliation_string":"Department of Control Theory and Robotics, TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082009236","display_name":"Maryam Kamgarpour","orcid":"https://orcid.org/0000-0003-0230-3518"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Maryam Kamgarpour","raw_affiliation_strings":["EPFL School of Engineering, Sycamore Lab, Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0003-0230-3518","affiliations":[{"raw_affiliation_string":"EPFL School of Engineering, Sycamore Lab, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.1646,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.86829975,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":"11","issue":"4","first_page":"1790","last_page":"1799"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.7573446035385132},{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.5805982351303101},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5570545196533203},{"id":"https://openalex.org/keywords/best-response","display_name":"Best response","score":0.5450690984725952},{"id":"https://openalex.org/keywords/stochastic-game","display_name":"Stochastic game","score":0.5116320252418518},{"id":"https://openalex.org/keywords/monotone-polygon","display_name":"Monotone polygon","score":0.5115845799446106},{"id":"https://openalex.org/keywords/iterated-function","display_name":"Iterated function","score":0.5001423358917236},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.46980318427085876},{"id":"https://openalex.org/keywords/monotonic-function","display_name":"Monotonic function","score":0.4542466104030609},{"id":"https://openalex.org/keywords/risk-dominance","display_name":"Risk dominance","score":0.450364351272583},{"id":"https://openalex.org/keywords/repeated-game","display_name":"Repeated game","score":0.4366745948791504},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.43185582756996155},{"id":"https://openalex.org/keywords/epsilon-equilibrium","display_name":"Epsilon-equilibrium","score":0.41374316811561584},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.41280800104141235},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.37041062116622925}],"concepts":[{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.7573446035385132},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.5805982351303101},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5570545196533203},{"id":"https://openalex.org/C32407928","wikidata":"https://www.wikidata.org/wiki/Q2733833","display_name":"Best response","level":3,"score":0.5450690984725952},{"id":"https://openalex.org/C22171661","wikidata":"https://www.wikidata.org/wiki/Q1074380","display_name":"Stochastic game","level":2,"score":0.5116320252418518},{"id":"https://openalex.org/C2834757","wikidata":"https://www.wikidata.org/wiki/Q4925424","display_name":"Monotone polygon","level":2,"score":0.5115845799446106},{"id":"https://openalex.org/C140479938","wikidata":"https://www.wikidata.org/wiki/Q5254619","display_name":"Iterated function","level":2,"score":0.5001423358917236},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.46980318427085876},{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.4542466104030609},{"id":"https://openalex.org/C22349654","wikidata":"https://www.wikidata.org/wiki/Q2039354","display_name":"Risk dominance","level":5,"score":0.450364351272583},{"id":"https://openalex.org/C202556891","wikidata":"https://www.wikidata.org/wiki/Q1584646","display_name":"Repeated game","level":3,"score":0.4366745948791504},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.43185582756996155},{"id":"https://openalex.org/C141824439","wikidata":"https://www.wikidata.org/wiki/Q307521","display_name":"Epsilon-equilibrium","level":4,"score":0.41374316811561584},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.41280800104141235},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.37041062116622925},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcns.2024.3355035","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcns.2024.3355035","pdf_url":null,"source":{"id":"https://openalex.org/S2502544478","display_name":"IEEE Transactions on Control of Network Systems","issn_l":"2325-5870","issn":["2325-5870","2372-2533"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control of Network Systems","raw_type":"journal-article"},{"id":"pmh:oai:infoscience.epfl.ch:20.500.14299/242395","is_oa":true,"landing_page_url":"https://infoscience.epfl.ch/handle/20.500.14299/242395","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"research article"}],"best_oa_location":{"id":"pmh:oai:infoscience.epfl.ch:20.500.14299/242395","is_oa":true,"landing_page_url":"https://infoscience.epfl.ch/handle/20.500.14299/242395","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"research article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W183050033","https://openalex.org/W1570963478","https://openalex.org/W1972221945","https://openalex.org/W1972711404","https://openalex.org/W1997949764","https://openalex.org/W2008796819","https://openalex.org/W2014837638","https://openalex.org/W2024612830","https://openalex.org/W2058626062","https://openalex.org/W2066767736","https://openalex.org/W2081316950","https://openalex.org/W2088077079","https://openalex.org/W2125913552","https://openalex.org/W2130772252","https://openalex.org/W2149479912","https://openalex.org/W2157394646","https://openalex.org/W2167598090","https://openalex.org/W2176451521","https://openalex.org/W2484003876","https://openalex.org/W2752505153","https://openalex.org/W2765459668","https://openalex.org/W2888709019","https://openalex.org/W2994637526","https://openalex.org/W3001078900","https://openalex.org/W3028369166","https://openalex.org/W3044550089","https://openalex.org/W4211108990","https://openalex.org/W4213077960","https://openalex.org/W4234067117","https://openalex.org/W4243772471","https://openalex.org/W4285875894","https://openalex.org/W4292064643","https://openalex.org/W4297672569","https://openalex.org/W4301791716","https://openalex.org/W4315489128","https://openalex.org/W4320200866","https://openalex.org/W6651597697","https://openalex.org/W6695508789","https://openalex.org/W6719581826","https://openalex.org/W6755056574","https://openalex.org/W6767052781","https://openalex.org/W6839121823","https://openalex.org/W6840489390"],"related_works":["https://openalex.org/W1853631319","https://openalex.org/W3192122086","https://openalex.org/W4301347782","https://openalex.org/W1554758635","https://openalex.org/W1667857601","https://openalex.org/W1976009178","https://openalex.org/W2013767790","https://openalex.org/W2092374696","https://openalex.org/W4365460918","https://openalex.org/W2904794353"],"abstract_inverted_index":{"We":[0,13,59],"address":[1],"learning":[2,38],"Nash":[3,70],"equilibria":[4],"in":[5,17,72],"convex":[6],"games":[7],"under":[8],"the":[9,15,19,68,76,83,88,101,105,113,118],"payoff":[10],"information":[11],"setting.":[12,74],"consider":[14],"case":[16],"which":[18],"game":[20,52,89],"pseudo-":[21],"gradient":[22],"is":[23],"monotone":[24],"but":[25],"not":[26],"necessarily":[27],"strictly":[28],"monotone.":[29],"This":[30],"relaxation":[31],"of":[32,37,44,78,93,104],"strict":[33],"monotonicity":[34],"enables":[35],"application":[36],"algorithms":[39],"to":[40,67,111,116],"a":[41,50,54,79],"larger":[42],"class":[43],"games,":[45],"such":[46],"as,":[47],"for":[48],"example,":[49],"zero-sum":[51],"with":[53],"merely":[55],"convex-concave":[56],"cost":[57],"function.":[58],"derive":[60],"an":[61,91,109],"algorithm":[62,106],"whose":[63],"iterates":[64],"provably":[65],"converge":[66],"least-norm":[69],"equilibrium":[71],"this":[73,97],"From":[75],"perspective":[77],"single":[80],"player":[81],"using":[82],"proposed":[84],"algorithm,":[85],"we":[86,99],"view":[87],"as":[90],"instance":[92],"online":[94],"optimization.":[95],"Through":[96],"lens,":[98],"quantify":[100],"regret":[102,119],"rate":[103],"and":[107],"provide":[108],"approach":[110],"choose":[112],"algorithm's":[114],"parameters":[115],"minimize":[117],"rate.":[120]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}