{"id":"https://openalex.org/W4385565498","doi":"https://doi.org/10.1145/3580305.3599359","title":"GAT-MF: Graph Attention Mean Field for Very Large Scale Multi-Agent Reinforcement Learning","display_name":"GAT-MF: Graph Attention Mean Field for Very Large Scale Multi-Agent Reinforcement Learning","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4385565498","doi":"https://doi.org/10.1145/3580305.3599359"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599359","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599359","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051274227","display_name":"Qianyue Hao","orcid":"https://orcid.org/0000-0002-7109-3588"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qianyue Hao","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111794931","display_name":"Wenzhen Huang","orcid":"https://orcid.org/0000-0003-0454-7516"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenzhen Huang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101472243","display_name":"Tao Feng","orcid":"https://orcid.org/0000-0002-7341-0225"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Feng","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100347994","display_name":"Jian Yuan","orcid":"https://orcid.org/0000-0001-9734-6056"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Yuan","raw_affiliation_strings":["Tsinghua University, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100355277","display_name":"Yong Li","orcid":"https://orcid.org/0000-0001-5617-1659"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Li","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5051274227"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":3.1109,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.93175054,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"685","last_page":"697"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.972100019454956,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9240999817848206,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8572701215744019},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7714072465896606},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.7517392635345459},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5105270147323608},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.4869016706943512},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4561956524848938},{"id":"https://openalex.org/keywords/mathematical-proof","display_name":"Mathematical proof","score":0.4501948654651642},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4198416769504547},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3937840461730957},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.37647223472595215},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10967165231704712},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1075146496295929}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8572701215744019},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7714072465896606},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.7517392635345459},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5105270147323608},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.4869016706943512},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4561956524848938},{"id":"https://openalex.org/C108710211","wikidata":"https://www.wikidata.org/wiki/Q11538","display_name":"Mathematical proof","level":2,"score":0.4501948654651642},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4198416769504547},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3937840461730957},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37647223472595215},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10967165231704712},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1075146496295929},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580305.3599359","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599359","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.4099999964237213}],"awards":[{"id":"https://openalex.org/G1005744610","display_name":null,"funder_award_id":"61972223, U1936217, 61971267","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1614471940","display_name":null,"funder_award_id":"2020AAA0","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3710896277","display_name":null,"funder_award_id":"61971267","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3734416573","display_name":null,"funder_award_id":"61972223","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4872662616","display_name":null,"funder_award_id":"U1936217","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7024251178","display_name":null,"funder_award_id":"2020AAA0106000","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329777","display_name":"Beijing National Research Center For Information Science And Technology","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2617547828","https://openalex.org/W2794643322","https://openalex.org/W2963725394","https://openalex.org/W2981224708","https://openalex.org/W2997070234","https://openalex.org/W2997940961","https://openalex.org/W2998367975","https://openalex.org/W2998489261","https://openalex.org/W3013198216","https://openalex.org/W3041678225","https://openalex.org/W3133972827","https://openalex.org/W3145159167","https://openalex.org/W3153079815","https://openalex.org/W3171599858","https://openalex.org/W3190593074","https://openalex.org/W3195968524","https://openalex.org/W3208346261","https://openalex.org/W3208460365","https://openalex.org/W3212219118","https://openalex.org/W4225665995","https://openalex.org/W4290943900","https://openalex.org/W6803519892"],"related_works":["https://openalex.org/W1667647204","https://openalex.org/W2404647514","https://openalex.org/W4247536566","https://openalex.org/W2018477250","https://openalex.org/W3119814709","https://openalex.org/W4241418540","https://openalex.org/W1508895727","https://openalex.org/W2725786787","https://openalex.org/W1875930651","https://openalex.org/W55831818"],"abstract_inverted_index":{"Recent":[0],"advancements":[1],"in":[2,42,80,96,102,160,207],"reinforcement":[3,26],"learning":[4,27],"have":[5],"witnessed":[6],"remarkable":[7,237],"achievements":[8],"by":[9],"intelligent":[10],"agents":[11,60,70,110,115],"ranging":[12],"from":[13],"game-playing":[14],"to":[15,45,54,122,186,253],"industrial":[16],"applications.":[17],"Of":[18],"particular":[19],"interest":[20],"is":[21],"the":[22,67,84,91,105,189,219,231,254],"area":[23],"of":[24,48,59,66,69,86,93,107,170,176,194,200,221,239],"multi-agent":[25,81],"(MARL),":[28],"which":[29],"holds":[30],"significant":[31],"potential":[32],"for":[33],"real-world":[34,211],"scenarios.":[35],"However,":[36],"typical":[37],"MARL":[38],"methods":[39],"are":[40,78,265],"limited":[41],"their":[43],"ability":[44],"handle":[46],"tens":[47],"agents,":[49,94,216],"leaving":[50],"scenarios":[51,212],"with":[52,90,173,235],"up":[53,65],"hundreds":[55],"or":[56],"even":[57],"thousands":[58],"almost":[61],"unexplored.":[62],"The":[63,163,224],"scaling":[64],"number":[68,85,92],"presents":[71],"two":[72],"primary":[73],"challenges:":[74],"(1)":[75],"agent-agent":[76,143],"interactions":[77,87,108,144,146],"crucial":[79],"systems":[82],"while":[83],"grows":[88],"quadratically":[89],"resulting":[95],"substantial":[97,158],"computational":[98,161],"complexity":[99],"and":[100,116,150,191,210,248,263],"difficulty":[101],"strategies-learning;":[103],"(2)":[104],"strengths":[106,193],"among":[109],"exhibit":[111],"variations":[112],"both":[113,208],"across":[114],"over":[117,214],"time,":[118],"making":[119],"it":[120],"difficult":[121],"precisely":[123],"model":[124],"such":[125],"interactions.":[126,202],"In":[127],"this":[128],"paper,":[129],"we":[130,155,180,217],"propose":[131],"a":[132,151,157,167,182,236],"novel":[133],"approach":[134],"named":[135],"Graph":[136],"Attention":[137],"Mean":[138],"Field":[139],"(GAT-MF).":[140],"By":[141],"converting":[142],"into":[145],"between":[147],"each":[148],"agent":[149,201],"weighted":[152],"mean":[153],"field,":[154],"achieve":[156],"reduction":[159],"complexity.":[162],"proposed":[164],"method":[165,229,234,243],"offers":[166],"precise":[168],"modeling":[169],"interaction":[171],"dynamics":[172],"mathematical":[174],"proofs":[175],"its":[177],"correctness.":[178],"Additionally,":[179],"design":[181],"graph":[183],"attention":[184],"mechanism":[185],"automatically":[187],"capture":[188],"diverse":[190],"time-varying":[192],"interactions,":[195],"ensuring":[196],"an":[197],"accurate":[198],"representation":[199],"Through":[203],"extensive":[204],"experimentation":[205],"conducted":[206],"manual":[209],"involving":[213],"3000":[215],"validate":[218],"efficacy":[220],"our":[222,228,242,260],"method.":[223,257],"results":[225],"demonstrate":[226],"that":[227],"outperforms":[230],"best":[232,255],"baseline":[233,256],"improvement":[238],"42.7%.":[240],"Furthermore,":[241],"saves":[244],"86.4%":[245],"training":[246],"time":[247],"19.2%":[249],"GPU":[250],"memory":[251],"compared":[252],"For":[258],"reproducibility,":[259],"source":[261],"codes":[262],"data":[264],"available":[266],"at":[267],"https://github.com/tsinghua-fib-lab/Large-Scale-MARL-GATMF.":[268]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":7}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
