{"id":"https://openalex.org/W4402156783","doi":"https://doi.org/10.1109/icc51166.2024.10622437","title":"HA-MARL: Heuristic and APF Assisted Multi-Agent Reinforcement Learning for Wireless Data Sharing in AUV Swarms","display_name":"HA-MARL: Heuristic and APF Assisted Multi-Agent Reinforcement Learning for Wireless Data Sharing in AUV Swarms","publication_year":2024,"publication_date":"2024-06-09","ids":{"openalex":"https://openalex.org/W4402156783","doi":"https://doi.org/10.1109/icc51166.2024.10622437"},"language":"en","primary_location":{"id":"doi:10.1109/icc51166.2024.10622437","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icc51166.2024.10622437","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICC 2024 - IEEE International Conference on Communications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100731664","display_name":"Zonglin Li","orcid":"https://orcid.org/0000-0002-4599-4112"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zonglin Li","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University,Shenzhen,China,518055"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033168204","display_name":"Jun Du","orcid":"https://orcid.org/0000-0002-5213-8808"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Du","raw_affiliation_strings":["Tsinghua University,Department of Electronic Engineering,Beijing,China,100083"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Department of Electronic Engineering,Beijing,China,100083","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005072193","display_name":"Chunxiao Jiang","orcid":"https://orcid.org/0000-0002-3703-121X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunxiao Jiang","raw_affiliation_strings":["Tsinghua Space Center, Tsinghua University,Beijing,China,100083"],"affiliations":[{"raw_affiliation_string":"Tsinghua Space Center, Tsinghua University,Beijing,China,100083","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065214878","display_name":"Weishi Mi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weishi Mi","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University,Shenzhen,China,518055"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University,Shenzhen,China,518055","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109066646","display_name":"Yong Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Ren","raw_affiliation_strings":["Tsinghua University,Department of Electronic Engineering,Beijing,China,100083"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Department of Electronic Engineering,Beijing,China,100083","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100731664"],"corresponding_institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.2225,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.52367968,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"5401","last_page":"5406"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10246","display_name":"Mobile Ad Hoc Networks","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7560692429542542},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.680361807346344},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6648166179656982},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.5618966817855835},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26041868329048157},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.18756696581840515}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7560692429542542},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.680361807346344},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6648166179656982},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.5618966817855835},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26041868329048157},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.18756696581840515}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icc51166.2024.10622437","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icc51166.2024.10622437","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICC 2024 - IEEE International Conference on Communications","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3010749700","display_name":null,"funder_award_id":"61971257,U23A20281,62325108","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W2978329087","https://openalex.org/W3089283090","https://openalex.org/W3118592785","https://openalex.org/W3176048614","https://openalex.org/W3217049948","https://openalex.org/W4298848549","https://openalex.org/W4304987262","https://openalex.org/W4313030791","https://openalex.org/W6748523217","https://openalex.org/W6781210820","https://openalex.org/W6840380725"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109","https://openalex.org/W4362501864","https://openalex.org/W2001405890"],"abstract_inverted_index":{"This":[0],"paper":[1],"focuses":[2],"on":[3],"the":[4,23,50,63,78,101,145],"design":[5],"of":[6,65,103],"intelligent":[7,42],"game":[8,43],"strategy":[9,44],"for":[10,119],"multi-autonomous":[11],"underwater":[12,15,31,35],"vehicle":[13],"(multi-AUV)":[14],"network":[16],"system.":[17],"The":[18],"challenge":[19],"lies":[20],"in":[21,29,70,106],"ensuring":[22],"coordination":[24,79],"and":[25,76,86,114],"stability":[26],"between":[27],"AUVs":[28],"complex":[30],"environments.":[32],"To":[33],"meet":[34],"data":[36],"sharing":[37],"requirements,":[38],"we":[39,82],"formulate":[40],"an":[41],"incorporating":[45],"communication":[46],"delays":[47],"by":[48,108],"formulating":[49],"problem":[51],"as":[52,111],"a":[53,84],"partially":[54],"observable":[55],"Markov":[56],"decision":[57],"process":[58],"(POMDP).":[59],"Additionally,":[60],"to":[61,122],"address":[62],"issue":[64,102],"sparse":[66,104],"rewards":[67,105],"during":[68],"exploration":[69],"multi-agent":[71,91],"reinforcement":[72],"learning":[73],"(MARL)":[74],"models":[75],"improve":[77],"among":[80],"AUVs,":[81],"propose":[83],"heuristic":[85,117],"artificial":[87],"potential":[88],"field":[89],"(APF)-assisted":[90],"proximal":[92],"policy":[93],"optimization":[94],"(HA-MAPPO)":[95],"algorithm.":[96],"Our":[97],"proposed":[98,132],"scheme":[99],"addresses":[100],"MARL":[107,138],"using":[109],"APF":[110],"path":[112],"planner":[113],"subsequently":[115],"utilizes":[116],"algorithm":[118,134],"task":[120],"scheduling":[121],"achieve":[123],"optimal":[124],"goal":[125],"allocation.":[126],"Simulation":[127],"results":[128],"demonstrate":[129],"that":[130],"our":[131],"HA-MAPPO":[133],"outperforms":[135],"current":[136],"mainstream":[137],"algorithms":[139],"regarding":[140],"convergence":[141],"speed":[142],"while":[143],"maximizing":[144],"winning":[146],"rates.":[147]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
