{"id":"https://openalex.org/W3208215078","doi":"https://doi.org/10.1137/20m1360700","title":"Mean-Field Controls with Q-Learning for Cooperative MARL: Convergence and Complexity Analysis","display_name":"Mean-Field Controls with Q-Learning for Cooperative MARL: Convergence and Complexity Analysis","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3208215078","doi":"https://doi.org/10.1137/20m1360700","mag":"3208215078"},"language":"en","primary_location":{"id":"doi:10.1137/20m1360700","is_oa":true,"landing_page_url":"https://doi.org/10.1137/20m1360700","pdf_url":"https://epubs.siam.org/doi/pdf/10.1137/20M1360700","source":{"id":"https://openalex.org/S4210229561","display_name":"SIAM Journal on Mathematics of Data Science","issn_l":"2577-0187","issn":["2577-0187"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Mathematics of Data Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://epubs.siam.org/doi/pdf/10.1137/20M1360700","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047850847","display_name":"Haotian Gu","orcid":"https://orcid.org/0000-0002-0268-7147"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Haotian Gu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085674806","display_name":"Xin Guo","orcid":"https://orcid.org/0000-0002-3350-4606"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xin Guo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007953835","display_name":"Xiaoli Wei","orcid":"https://orcid.org/0000-0002-4787-2856"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiaoli Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5068576165","display_name":"Renyuan Xu","orcid":"https://orcid.org/0000-0003-4293-3450"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Renyuan Xu","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0003-4293-3450","affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047850847"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.469,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.92916999,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"3","issue":"4","first_page":"1168","last_page":"1196"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14083","display_name":"Extremum Seeking Control Systems","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14083","display_name":"Extremum Seeking Control Systems","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6369935274124146},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6292872428894043},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.530663788318634},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.51519376039505},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.461595743894577},{"id":"https://openalex.org/keywords/subject","display_name":"Subject (documents)","score":0.4253700375556946},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.39918339252471924},{"id":"https://openalex.org/keywords/mathematics-education","display_name":"Mathematics education","score":0.32180771231651306},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30283427238464355},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2460656464099884},{"id":"https://openalex.org/keywords/library-science","display_name":"Library science","score":0.23878705501556396},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.21841105818748474},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18345603346824646},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.07590523362159729}],"concepts":[{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6369935274124146},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6292872428894043},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.530663788318634},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.51519376039505},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.461595743894577},{"id":"https://openalex.org/C2777855551","wikidata":"https://www.wikidata.org/wiki/Q12310021","display_name":"Subject (documents)","level":2,"score":0.4253700375556946},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.39918339252471924},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.32180771231651306},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30283427238464355},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2460656464099884},{"id":"https://openalex.org/C161191863","wikidata":"https://www.wikidata.org/wiki/Q199655","display_name":"Library science","level":1,"score":0.23878705501556396},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.21841105818748474},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18345603346824646},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.07590523362159729},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1137/20m1360700","is_oa":true,"landing_page_url":"https://doi.org/10.1137/20m1360700","pdf_url":"https://epubs.siam.org/doi/pdf/10.1137/20M1360700","source":{"id":"https://openalex.org/S4210229561","display_name":"SIAM Journal on Mathematics of Data Science","issn_l":"2577-0187","issn":["2577-0187"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Mathematics of Data Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1137/20m1360700","is_oa":true,"landing_page_url":"https://doi.org/10.1137/20m1360700","pdf_url":"https://epubs.siam.org/doi/pdf/10.1137/20M1360700","source":{"id":"https://openalex.org/S4210229561","display_name":"SIAM Journal on Mathematics of Data Science","issn_l":"2577-0187","issn":["2577-0187"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Mathematics of Data Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3208215078.pdf","grobid_xml":"https://content.openalex.org/works/W3208215078.grobid-xml"},"referenced_works_count":48,"referenced_works":["https://openalex.org/W15601695","https://openalex.org/W565357261","https://openalex.org/W1550698229","https://openalex.org/W1552830313","https://openalex.org/W1557517019","https://openalex.org/W1569313452","https://openalex.org/W1946137962","https://openalex.org/W1975228357","https://openalex.org/W1983321045","https://openalex.org/W1987866956","https://openalex.org/W2011000015","https://openalex.org/W2032916024","https://openalex.org/W2038686546","https://openalex.org/W2064778949","https://openalex.org/W2088595989","https://openalex.org/W2117355432","https://openalex.org/W2118556122","https://openalex.org/W2118686230","https://openalex.org/W2119062437","https://openalex.org/W2121863487","https://openalex.org/W2148024708","https://openalex.org/W2160698719","https://openalex.org/W2257979135","https://openalex.org/W2402143959","https://openalex.org/W2568938645","https://openalex.org/W2593952959","https://openalex.org/W2736601468","https://openalex.org/W2785315072","https://openalex.org/W2788125442","https://openalex.org/W2797811993","https://openalex.org/W2902676408","https://openalex.org/W2949608212","https://openalex.org/W2950163914","https://openalex.org/W2962764167","https://openalex.org/W2962856092","https://openalex.org/W2963293760","https://openalex.org/W2963617451","https://openalex.org/W2970875146","https://openalex.org/W2981038142","https://openalex.org/W2991046523","https://openalex.org/W2996026485","https://openalex.org/W3033842056","https://openalex.org/W3035903830","https://openalex.org/W3048890299","https://openalex.org/W3110309042","https://openalex.org/W3195511071","https://openalex.org/W4230510522","https://openalex.org/W4245296547"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4388258507","https://openalex.org/W2392013855","https://openalex.org/W4318064328","https://openalex.org/W2357926602","https://openalex.org/W2374569605","https://openalex.org/W2386062718","https://openalex.org/W899618282","https://openalex.org/W2386129765","https://openalex.org/W2368742525"],"abstract_inverted_index":{"Related":[0],"DatabasesWeb":[1],"of":[2],"Science":[3],"You":[4],"must":[5],"be":[6],"logged":[7],"in":[8],"with":[9],"an":[10],"active":[11],"subscription":[12],"to":[13],"view":[14],"this.Article":[15],"DataHistorySubmitted:":[16],"15":[17],"October":[18,25],"2020Accepted:":[19],"16":[20],"August":[21],"2021Published":[22],"online:":[23],"28":[24],"2021Keywordsmean-field":[26],"control,":[27],"multi-agent":[28],"reinforcement":[29],"learning,":[30],"Q-learning,":[31],"cooperative":[32],"games,":[33],"dynamic":[34],"programming":[35],"principleAMS":[36],"Subject":[37],"Headings49N80,":[38],"68Q32,":[39],"68T05,":[40],"90C40Publication":[41],"DataISSN":[42],"(online):":[43],"2577-0187Publisher:":[44],"Society":[45],"for":[46],"Industrial":[47],"and":[48],"Applied":[49],"MathematicsCODEN:":[50],"sjmdaq":[51]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
