{"id":"https://openalex.org/W4402628029","doi":"https://doi.org/10.1109/apwcs61586.2024.10679289","title":"Diffusion-Based Multi-Agent Reinforcement Learning with Communication","display_name":"Diffusion-Based Multi-Agent Reinforcement Learning with Communication","publication_year":2024,"publication_date":"2024-08-21","ids":{"openalex":"https://openalex.org/W4402628029","doi":"https://doi.org/10.1109/apwcs61586.2024.10679289"},"language":"en","primary_location":{"id":"doi:10.1109/apwcs61586.2024.10679289","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apwcs61586.2024.10679289","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE VTS Asia Pacific Wireless Communications Symposium (APWCS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103944682","display_name":"Xinyue Qi","orcid":"https://orcid.org/0000-0001-5331-5274"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xinyue Qi","raw_affiliation_strings":["College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics,China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003622027","display_name":"Jianhang Tang","orcid":"https://orcid.org/0000-0003-3329-9582"},"institutions":[{"id":"https://openalex.org/I178232147","display_name":"Guizhou University","ror":"https://ror.org/02wmsc916","country_code":"CN","type":"education","lineage":["https://openalex.org/I178232147"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhang Tang","raw_affiliation_strings":["Guizhou University,State Key Laboratory of Public Big Data,China"],"affiliations":[{"raw_affiliation_string":"Guizhou University,State Key Laboratory of Public Big Data,China","institution_ids":["https://openalex.org/I178232147"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031914716","display_name":"Jiangming Jin","orcid":"https://orcid.org/0000-0001-7552-6937"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiangming Jin","raw_affiliation_strings":["Qingcheng AI"],"affiliations":[{"raw_affiliation_string":"Qingcheng AI","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100354608","display_name":"Yang Zhang","orcid":"https://orcid.org/0000-0001-9229-7689"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Zhang","raw_affiliation_strings":["College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics,China","institution_ids":["https://openalex.org/I9842412"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103944682"],"corresponding_institution_ids":["https://openalex.org/I9842412"],"apc_list":null,"apc_paid":null,"fwci":0.698,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72197233,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.37389999628067017,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.37389999628067017,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7523036003112793},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.703635573387146},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5419860482215881},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.49384695291519165},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33375170826911926},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06658315658569336}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7523036003112793},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.703635573387146},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5419860482215881},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.49384695291519165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33375170826911926},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06658315658569336},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apwcs61586.2024.10679289","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apwcs61586.2024.10679289","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE VTS Asia Pacific Wireless Communications Symposium (APWCS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.41999998688697815,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G6516776612","display_name":null,"funder_award_id":"62071343","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W3087576197","https://openalex.org/W4386076407","https://openalex.org/W6692846177","https://openalex.org/W6738796088","https://openalex.org/W6748839928","https://openalex.org/W6757469721","https://openalex.org/W6766805167","https://openalex.org/W6791040878","https://openalex.org/W6793444178","https://openalex.org/W6796589144","https://openalex.org/W6838483015","https://openalex.org/W6840380725","https://openalex.org/W6841549819","https://openalex.org/W6852710630","https://openalex.org/W6862975523"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109","https://openalex.org/W4362501864","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Multi-agent":[0],"systems":[1,53,62],"(MAS)":[2],"have":[3],"been":[4],"widely":[5],"used":[6],"as":[7,20,60],"a":[8,90,114],"modeling":[9],"tool":[10],"to":[11,44,54,70,96],"analyze":[12],"the":[13],"behaviors":[14],"of":[15,28,47,83,108,138],"members":[16],"in":[17,51,77,113,136],"groups,":[18],"such":[19],"swarms,":[21],"autonomous":[22],"vehicle":[23],"fleets,":[24],"and":[25,35,49,66,73,80,123,141],"smart":[26],"Internet":[27],"Things":[29],"devices.":[30],"With":[31],"their":[32],"distributed":[33],"architecture":[34],"model-free":[36],"nature,":[37],"reinforcement":[38,85],"learning":[39,139],"(RL)":[40],"is":[41,111],"often":[42],"deployed":[43],"address":[45],"issues":[46],"decision-making":[48],"action-taking":[50],"multi-agent":[52,61,84,116],"optimize":[55],"overall":[56],"system":[57,104,118],"performance.":[58,143],"However,":[59],"involve":[63],"agent":[64],"coordination":[65],"interactions,":[67],"this":[68,109],"leads":[69],"extensive":[71],"communication":[72,102,129],"computation":[74],"overhead,":[75],"resulting":[76],"decreased":[78],"performance":[79],"slower":[81],"convergence":[82],"learning.":[86],"This":[87],"work":[88],"integrates":[89],"diffusion":[91],"model":[92],"into":[93,100],"RL":[94],"training":[95],"accelerate":[97],"decision-making,":[98],"taking":[99],"account":[101],"among":[103],"agents.":[105],"The":[106],"effectiveness":[107],"method":[110],"validated":[112],"grid-based":[115],"predator-prey":[117],"scenario,":[119],"where":[120],"agents":[121],"interact":[122],"confront":[124],"each":[125],"other":[126],"via":[127],"mutual":[128],"networks.":[130],"Experimental":[131],"results":[132],"show":[133],"significant":[134],"improvements":[135],"terms":[137],"efficiency":[140],"task":[142]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-29T08:15:47.926485","created_date":"2025-10-10T00:00:00"}
