{"id":"https://openalex.org/W4409364162","doi":"https://doi.org/10.1609/aaai.v39i17.34021","title":"GTDE: Grouped Training with Decentralized Execution for Multi-agent Actor-Critic","display_name":"GTDE: Grouped Training with Decentralized Execution for Multi-agent Actor-Critic","publication_year":2025,"publication_date":"2025-04-11","ids":{"openalex":"https://openalex.org/W4409364162","doi":"https://doi.org/10.1609/aaai.v39i17.34021"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v39i17.34021","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i17.34021","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34021/36176","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34021/36176","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037430263","display_name":"Man Li","orcid":"https://orcid.org/0000-0002-8181-9688"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mengxian Li","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences\nUniversity of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences\nUniversity of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115695547","display_name":"Qi Wang","orcid":"https://orcid.org/0009-0000-0757-3627"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Wang","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences\nUniversity of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences\nUniversity of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101157792","display_name":"Yongjun Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongjun Xu","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences\nUniversity of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences\nUniversity of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5037430263"],"corresponding_institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":1.8141,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.83249428,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"39","issue":"17","first_page":"18368","last_page":"18376"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9739999771118164,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9739999771118164,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.7176032066345215},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47692984342575073},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.10339906811714172}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.7176032066345215},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47692984342575073},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.10339906811714172},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v39i17.34021","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i17.34021","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34021/36176","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v39i17.34021","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i17.34021","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/34021/36176","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409364162.pdf","grobid_xml":"https://content.openalex.org/works/W4409364162.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W230091440","https://openalex.org/W2390279801","https://openalex.org/W2233261550","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2810751659"],"abstract_inverted_index":{"The":[0,26],"rapid":[1],"advancement":[2],"of":[3,19,28,51,57,76,80,92,118,169,211],"multi-agent":[4,24,120],"reinforcement":[5],"learning":[6],"(MARL)":[7],"has":[8],"given":[9],"rise":[10],"to":[11,15,163,178,214],"diverse":[12],"training":[13,30,36,90,94,116],"paradigms":[14,27],"learn":[16],"the":[17,23,49,54,62,74,77,83,101,115,154,164,167,190,205,215,231],"policies":[18],"each":[20,132],"agent":[21,133],"in":[22,166,171,196],"system.":[25],"decentralized":[29,38,95],"and":[31,34,44,107],"execution":[32,39,96],"(DTDE)":[33],"centralized":[35,105],"with":[37,200,221],"(CTDE)":[40],"have":[41],"been":[42],"proposed":[43],"widely":[45],"applied.":[46],"However,":[47],"as":[48,66],"number":[50,79,168],"agents":[52,81],"increases,":[53],"inherent":[55],"limitations":[56],"these":[58],"frameworks":[59],"significantly":[60],"degrade":[61],"performance":[63,84],"metrics,":[64,85],"such":[65],"win":[67,228],"rate,":[68],"total":[69,206],"reward,":[70],"etc.":[71],"To":[72,142,161],"reduce":[73],"influence":[75],"increasing":[78],"on":[82,110,138,153],"we":[86,123],"propose":[87],"a":[88,104,172,180,197,218,226],"novel":[89],"paradigm":[91],"grouped":[93],"(GTDE).":[97],"This":[98],"framework":[99],"eliminates":[100],"need":[102],"for":[103,149],"module":[106,184],"relies":[108],"solely":[109],"local":[111],"information,":[112],"effectively":[113],"meeting":[114],"requirements":[117],"large-scale":[119],"systems.":[121],"Specifically,":[122],"first":[124],"introduce":[125],"an":[126,209],"adaptive":[127],"grouping":[128,155],"module,":[129],"which":[130],"divides":[131],"into":[134],"different":[135],"groups":[136],"based":[137],"their":[139],"observation":[140],"history.":[141],"implement":[143,179],"end-to-end":[144],"training,":[145],"GTDE":[146,203,224],"uses":[147],"Gumbel-Sigmoid":[148],"efficient":[150],"point-to-point":[151],"sampling":[152],"distribution":[156],"while":[157],"ensuring":[158],"gradient":[159],"backpropagation.":[160],"adapt":[162],"uncertainty":[165],"members":[170],"group,":[173],"two":[174],"methods":[175],"are":[176],"used":[177],"group":[181],"information":[182,188],"aggregation":[183],"that":[185,195],"merges":[186],"member":[187],"within":[189],"group.":[191],"Empirical":[192],"results":[193],"show":[194],"cooperative":[198],"environment":[199,220],"495":[201],"agents,":[202,223],"increased":[204],"reward":[207],"by":[208],"average":[210],"382%":[212],"compared":[213],"baseline.":[216,232],"In":[217],"competitive":[219],"64":[222],"achieved":[225],"100%":[227],"rate":[229],"against":[230]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-10T00:00:00"}
