{"id":"https://openalex.org/W4412549458","doi":"https://doi.org/10.32604/cmc.2025.067117","title":"Dynamic Decoupling-Driven Cooperative Pursuit for Multi-UAV Systems: A Multi-Agent Reinforcement Learning Policy Optimization Approach","display_name":"Dynamic Decoupling-Driven Cooperative Pursuit for Multi-UAV Systems: A Multi-Agent Reinforcement Learning Policy Optimization Approach","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412549458","doi":"https://doi.org/10.32604/cmc.2025.067117"},"language":"en","primary_location":{"id":"doi:10.32604/cmc.2025.067117","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.067117","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.32604/cmc.2025.067117","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111381951","display_name":"Lei Lei","orcid":"https://orcid.org/0000-0001-5891-5236"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lei Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051354465","display_name":"Chengfu Wu","orcid":"https://orcid.org/0000-0002-4256-5021"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chengfu Wu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5021518674","display_name":"Huai\u2010Min Chen","orcid":"https://orcid.org/0000-0003-3553-2608"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huaimin Chen","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5111381951"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.9443,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.96742844,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"85","issue":"1","first_page":"1339","last_page":"1363"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10270","display_name":"Blockchain Technology Applications and Security","score":0.9483000040054321,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10270","display_name":"Blockchain Technology Applications and Security","score":0.9483000040054321,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9347000122070312,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9265999794006348,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8568670749664307},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.8081930875778198},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5891093611717224},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.4419420659542084},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4205833375453949},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.35070693492889404},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3270486295223236},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.23733261227607727},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18353262543678284},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11396285891532898},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.06445127725601196}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8568670749664307},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.8081930875778198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5891093611717224},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.4419420659542084},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4205833375453949},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.35070693492889404},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3270486295223236},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.23733261227607727},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18353262543678284},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11396285891532898},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.06445127725601196}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.32604/cmc.2025.067117","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.067117","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.32604/cmc.2025.067117","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.067117","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2408768628","https://openalex.org/W2782943365","https://openalex.org/W2810602713","https://openalex.org/W2895855868","https://openalex.org/W2945675984","https://openalex.org/W2981038142","https://openalex.org/W2991046523","https://openalex.org/W3000179003","https://openalex.org/W3014355579","https://openalex.org/W3085472573","https://openalex.org/W3094093649","https://openalex.org/W3198771491","https://openalex.org/W3203531525","https://openalex.org/W3209575760","https://openalex.org/W3209642584","https://openalex.org/W3214814008","https://openalex.org/W4205319053","https://openalex.org/W4213246061","https://openalex.org/W4226329847","https://openalex.org/W4310576394","https://openalex.org/W4312987110","https://openalex.org/W4392173075","https://openalex.org/W4403765774","https://openalex.org/W4407956488","https://openalex.org/W4408791788"],"related_works":["https://openalex.org/W4313561376","https://openalex.org/W3103825105","https://openalex.org/W3027880158","https://openalex.org/W3207533102","https://openalex.org/W1617565119","https://openalex.org/W160381218","https://openalex.org/W2512958550","https://openalex.org/W4306904969","https://openalex.org/W2004102934","https://openalex.org/W4366455350"],"abstract_inverted_index":{"This":[0,114],"paper":[1],"proposes":[2],"a":[3,58,91,154,170,174],"Multi-Agent":[4],"Attention":[5],"Proximal":[6],"Policy":[7],"Optimization":[8],"(MA2PPO)":[9],"algorithm":[10,194,216],"aiming":[11],"at":[12],"the":[13,29,64,73,81,98,110,117,144,162,166,189,192,215],"problems":[14,138],"such":[15,50],"as":[16],"credit":[17,111],"assignment,":[18],"low":[19,54],"collaboration":[20],"efficiency":[21,56,146],"and":[22,57,89,130,134,147,200],"weak":[23],"strategy":[24],"generalization":[25],"ability":[26],"existing":[27],"in":[28,49,61,195],"cooperative":[30,47,183,198,203],"pursuit":[31,184,199,204],"tasks":[32],"of":[33,191],"multiple":[34,151],"unmanned":[35],"aerial":[36],"vehicles":[37],"(UAVs).":[38],"Traditional":[39],"algorithms":[40],"often":[41],"fail":[42],"to":[43,53,108,119,160,164,180],"effectively":[44,127],"identify":[45,120],"critical":[46],"relationships":[48],"tasks,":[51],"leading":[52],"capture":[55],"significant":[59],"decline":[60],"performance":[62],"when":[63],"scale":[65],"expands.":[66],"To":[67],"tackle":[68],"these":[69],"issues,":[70],"based":[71],"on":[72,210],"proximal":[74],"policy":[75,148],"optimization":[76],"(PPO)":[77],"algorithm,":[78],"MA2PPO":[79],"adopts":[80],"centralized":[82,106],"training":[83,107],"with":[84,124,173],"decentralized":[85],"execution":[86],"(CTDE)":[87],"framework":[88],"introduces":[90],"dynamic":[92],"decoupling":[93],"mechanism,":[94],"that":[95,214],"is,":[96],"sharing":[97],"multi-head":[99],"attention":[100],"(MHA)":[101],"mechanism":[102],"for":[103,219],"critics":[104],"during":[105],"solve":[109],"assignment":[112],"problem.":[113],"method":[115],"enables":[116],"pursuers":[118,163],"highly":[121],"correlated":[122],"interactions":[123],"their":[125],"teammates,":[126],"eliminate":[128],"irrelevant":[129],"weakly":[131],"relevant":[132],"interactions,":[133],"decompose":[135],"large-scale":[136,220],"cooperation":[137],"into":[139],"decoupled":[140],"sub-problems,":[141],"thereby":[142],"enhancing":[143],"collaborative":[145],"stability":[149],"among":[150,206],"agents.":[152],"Furthermore,":[153],"reward":[155,172],"function":[156],"has":[157],"been":[158],"devised":[159],"facilitate":[161],"encircle":[165],"escapee":[167],"by":[168],"combining":[169],"formation":[171],"distance":[175],"reward,":[176],"which":[177],"incentivizes":[178],"UAVs":[179],"develop":[181],"sophisticated":[182],"strategies.":[185],"Experimental":[186],"results":[187],"demonstrate":[188],"effectiveness":[190],"proposed":[193],"achieving":[196],"multi-UAV":[197,221],"inducing":[201],"diverse":[202],"behaviors":[205],"UAVs.":[207],"Moreover,":[208],"experiments":[209],"scalability":[211],"have":[212],"demonstrated":[213],"is":[217],"suitable":[218],"systems.":[222]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
