{"id":"https://openalex.org/W3188155443","doi":"https://doi.org/10.24963/ijcai.2021/50","title":"Mean Field Games Flock! The Reinforcement Learning Way","display_name":"Mean Field Games Flock! The Reinforcement Learning Way","publication_year":2021,"publication_date":"2021-08-01","ids":{"openalex":"https://openalex.org/W3188155443","doi":"https://doi.org/10.24963/ijcai.2021/50","mag":"3188155443"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2021/50","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2021/50","pdf_url":"https://www.ijcai.org/proceedings/2021/0050.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.ijcai.org/proceedings/2021/0050.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031705919","display_name":"Sarah Perrin","orcid":"https://orcid.org/0000-0002-4488-6689"},"institutions":[{"id":"https://openalex.org/I7454413","display_name":"\u00c9cole Centrale de Lille","ror":"https://ror.org/01x441g73","country_code":"FR","type":"education","lineage":["https://openalex.org/I7454413"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Sarah Perrin","raw_affiliation_strings":["Univ. Lille, CNRS, Inria, Centrale Lille, UMR 9189 CRIStAL"],"affiliations":[{"raw_affiliation_string":"Univ. Lille, CNRS, Inria, Centrale Lille, UMR 9189 CRIStAL","institution_ids":["https://openalex.org/I7454413"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027824441","display_name":"Mathieu Lauri\u00e8re","orcid":"https://orcid.org/0000-0002-4380-1399"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mathieu Lauri\u00e8re","raw_affiliation_strings":["Princeton University, ORFE"],"affiliations":[{"raw_affiliation_string":"Princeton University, ORFE","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056707583","display_name":"Julien P\u00e9rolat","orcid":"https://orcid.org/0000-0002-8176-1666"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Julien P\u00e9rolat","raw_affiliation_strings":["DeepMind Paris"],"affiliations":[{"raw_affiliation_string":"DeepMind Paris","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110482875","display_name":"Matthieu Geist","orcid":null},"institutions":[{"id":"https://openalex.org/I4210113520","display_name":"Brain (Germany)","ror":"https://ror.org/01gamcy45","country_code":"DE","type":"company","lineage":["https://openalex.org/I4210113520"]},{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["DE","US"],"is_corresponding":false,"raw_author_name":"Matthieu Geist","raw_affiliation_strings":["Google Research, Brain Team"],"affiliations":[{"raw_affiliation_string":"Google Research, Brain Team","institution_ids":["https://openalex.org/I1291425158","https://openalex.org/I4210113520"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085971810","display_name":"Romuald \u00c9lie","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Romuald \u00c9lie","raw_affiliation_strings":["Deepmind Paris","DeepMind Paris"],"affiliations":[{"raw_affiliation_string":"Deepmind Paris","institution_ids":["https://openalex.org/I4210090411"]},{"raw_affiliation_string":"DeepMind Paris","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065100569","display_name":"Olivier Pietquin","orcid":"https://orcid.org/0000-0002-5386-465X"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113520","display_name":"Brain (Germany)","ror":"https://ror.org/01gamcy45","country_code":"DE","type":"company","lineage":["https://openalex.org/I4210113520"]}],"countries":["DE","US"],"is_corresponding":false,"raw_author_name":"Olivier Pietquin","raw_affiliation_strings":["Google Research, Brain Team"],"affiliations":[{"raw_affiliation_string":"Google Research, Brain Team","institution_ids":["https://openalex.org/I1291425158","https://openalex.org/I4210113520"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5031705919"],"corresponding_institution_ids":["https://openalex.org/I7454413"],"apc_list":null,"apc_paid":null,"fwci":2.62112995,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.8931855,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"356","last_page":"362"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11764","display_name":"Evolution and Genetic Dynamics","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11764","display_name":"Evolution and Genetic Dynamics","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10621","display_name":"Gene Regulatory Network Analysis","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10482","display_name":"Mathematical and Theoretical Epidemiology and Ecology Models","score":0.9861000180244446,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/flocking","display_name":"Flocking (texture)","score":0.9689575433731079},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8135931491851807},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.6592963337898254},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.642423689365387},{"id":"https://openalex.org/keywords/flock","display_name":"Flock","score":0.6243552565574646},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.5969986319541931},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4914325475692749},{"id":"https://openalex.org/keywords/fictitious-play","display_name":"Fictitious play","score":0.48696503043174744},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4584486186504364},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.27967381477355957},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.11795833706855774}],"concepts":[{"id":"https://openalex.org/C2781220375","wikidata":"https://www.wikidata.org/wiki/Q814208","display_name":"Flocking (texture)","level":2,"score":0.9689575433731079},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8135931491851807},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.6592963337898254},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.642423689365387},{"id":"https://openalex.org/C134215735","wikidata":"https://www.wikidata.org/wiki/Q120997","display_name":"Flock","level":2,"score":0.6243552565574646},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.5969986319541931},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4914325475692749},{"id":"https://openalex.org/C145071142","wikidata":"https://www.wikidata.org/wiki/Q1411116","display_name":"Fictitious play","level":3,"score":0.48696503043174744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4584486186504364},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27967381477355957},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.11795833706855774},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2021/50","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2021/50","pdf_url":"https://www.ijcai.org/proceedings/2021/0050.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.24963/ijcai.2021/50","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2021/50","pdf_url":"https://www.ijcai.org/proceedings/2021/0050.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirtieth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3188155443.pdf","grobid_xml":"https://content.openalex.org/works/W3188155443.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W1015133923","https://openalex.org/W1771410628","https://openalex.org/W1968154464","https://openalex.org/W2016775936","https://openalex.org/W2095257746","https://openalex.org/W2103714988","https://openalex.org/W2150312211","https://openalex.org/W2155027007","https://openalex.org/W2173248099","https://openalex.org/W2750605955","https://openalex.org/W2781726626","https://openalex.org/W2786314843","https://openalex.org/W2799183551","https://openalex.org/W2902907165","https://openalex.org/W2903583264","https://openalex.org/W2921843114","https://openalex.org/W2945395894","https://openalex.org/W2963090522","https://openalex.org/W2963864421","https://openalex.org/W2968203283","https://openalex.org/W2992005611","https://openalex.org/W2995185709","https://openalex.org/W2997345668","https://openalex.org/W3016115703","https://openalex.org/W3025729845","https://openalex.org/W3039107284","https://openalex.org/W4287727431","https://openalex.org/W4297789683","https://openalex.org/W4311549306","https://openalex.org/W6610566761","https://openalex.org/W6675328540","https://openalex.org/W6847073524","https://openalex.org/W7074691498"],"related_works":["https://openalex.org/W2091794545","https://openalex.org/W2085338444","https://openalex.org/W2796348713","https://openalex.org/W2317978638","https://openalex.org/W4214835929","https://openalex.org/W4226086326","https://openalex.org/W4287180847","https://openalex.org/W3119014777","https://openalex.org/W3188155443","https://openalex.org/W1570906179"],"abstract_inverted_index":{"We":[0,35,95,119],"present":[1],"a":[2,5,19,40,68,79],"method":[3],"enabling":[4],"large":[6],"number":[7],"of":[8,21],"agents":[9,84],"to":[10,13,88],"learn":[11,126],"how":[12],"flock.":[14],"This":[15],"problem":[16,38],"has":[17],"drawn":[18],"lot":[20],"interest":[22],"but":[23],"requires":[24],"many":[25],"structural":[26],"assumptions":[27],"and":[28,62,82,99,110],"is":[29],"tractable":[30,69],"only":[31,72],"in":[32],"small":[33],"dimensions.":[34],"phrase":[36],"this":[37],"as":[39],"Mean":[41],"Field":[42],"Game":[43],"(MFG),":[44],"where":[45],"each":[46],"individual":[47],"chooses":[48],"its":[49],"own":[50],"acceleration":[51],"depending":[52],"on":[53],"the":[54,83,90,113],"population":[55,115],"behavior.":[56],"Combining":[57],"Deep":[58,108],"Reinforcement":[59],"Learning":[60],"(RL)":[61],"Normalizing":[63],"Flows":[64],"(NF),":[65],"we":[66],"obtain":[67],"solution":[70],"requiring":[71],"very":[73],"weak":[74],"assumptions.":[75],"Our":[76],"algorithm":[77,124],"finds":[78],"Nash":[80],"Equilibrium":[81],"adapt":[85],"their":[86],"velocity":[87],"match":[89],"neighboring":[91],"flock\u2019s":[92],"average":[93],"one.":[94],"use":[96],"Fictitious":[97],"Play":[98],"alternate:":[100],"(1)":[101],"computing":[102],"an":[103],"approximate":[104],"best":[105],"response":[106],"with":[107,117,131],"RL,":[109],"(2)":[111],"estimating":[112],"next":[114],"distribution":[116],"NF.":[118],"show":[120],"numerically":[121],"that":[122],"our":[123],"can":[125],"multi-group":[127],"or":[128],"high-dimensional":[129],"flocking":[130],"obstacles.":[132]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
