{"id":"https://openalex.org/W7143510601","doi":"https://doi.org/10.1016/j.asoc.2026.115145","title":"Efficient multi-agent deep reinforcement learning algorithm for multi UAV collision avoidance","display_name":"Efficient multi-agent deep reinforcement learning algorithm for multi UAV collision avoidance","publication_year":2026,"publication_date":"2026-03-30","ids":{"openalex":"https://openalex.org/W7143510601","doi":"https://doi.org/10.1016/j.asoc.2026.115145"},"language":"en","primary_location":{"id":"doi:10.1016/j.asoc.2026.115145","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.asoc.2026.115145","pdf_url":null,"source":{"id":"https://openalex.org/S140556538","display_name":"Applied Soft Computing","issn_l":"1568-4946","issn":["1568-4946","1872-9681"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Soft Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.asoc.2026.115145","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075334437","display_name":"Mohammad Reza Rezaee","orcid":"https://orcid.org/0000-0002-8807-0083"},"institutions":[{"id":"https://openalex.org/I130343225","display_name":"Universiti Putra Malaysia","ror":"https://ror.org/02e91jd64","country_code":"MY","type":"education","lineage":["https://openalex.org/I130343225"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Mohammad Reza Rezaee","raw_affiliation_strings":["Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia"],"raw_orcid":"https://orcid.org/0000-0002-8807-0083","affiliations":[{"raw_affiliation_string":"Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia","institution_ids":["https://openalex.org/I130343225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020450057","display_name":"Nor Asilah Wati Abdul Hamid","orcid":"https://orcid.org/0000-0001-8095-7678"},"institutions":[{"id":"https://openalex.org/I130343225","display_name":"Universiti Putra Malaysia","ror":"https://ror.org/02e91jd64","country_code":"MY","type":"education","lineage":["https://openalex.org/I130343225"]}],"countries":["MY"],"is_corresponding":true,"raw_author_name":"Nor Asilah Wati Abdul Hamid","raw_affiliation_strings":["Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia","Institute for Mathematical Research, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia"],"raw_orcid":"https://orcid.org/0000-0001-8095-7678","affiliations":[{"raw_affiliation_string":"Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia","institution_ids":["https://openalex.org/I130343225"]},{"raw_affiliation_string":"Institute for Mathematical Research, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia","institution_ids":["https://openalex.org/I130343225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109069502","display_name":"M. F. H. Hussin","orcid":null},"institutions":[{"id":"https://openalex.org/I130343225","display_name":"Universiti Putra Malaysia","ror":"https://ror.org/02e91jd64","country_code":"MY","type":"education","lineage":["https://openalex.org/I130343225"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Masnida Hussin","raw_affiliation_strings":["Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia"],"raw_orcid":"https://orcid.org/0000-0003-1063-8502","affiliations":[{"raw_affiliation_string":"Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia","institution_ids":["https://openalex.org/I130343225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056464097","display_name":"Zuriati Ahmad Zukarnain","orcid":"https://orcid.org/0000-0003-2408-6956"},"institutions":[{"id":"https://openalex.org/I130343225","display_name":"Universiti Putra Malaysia","ror":"https://ror.org/02e91jd64","country_code":"MY","type":"education","lineage":["https://openalex.org/I130343225"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Zuriati Ahmad Zukarnain","raw_affiliation_strings":["Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia"],"raw_orcid":"https://orcid.org/0000-0003-2408-6956","affiliations":[{"raw_affiliation_string":"Faculty of Computer Science and Information Technology, Universiti Putra Malaysia, Serdang, 43400, Selangor, Malaysia","institution_ids":["https://openalex.org/I130343225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020450057"],"corresponding_institution_ids":["https://openalex.org/I130343225"],"apc_list":{"value":3350,"currency":"USD","value_usd":3350},"apc_paid":{"value":3350,"currency":"USD","value_usd":3350},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.69991628,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"197","issue":null,"first_page":"115145","last_page":"115145"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.5526000261306763,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.5526000261306763,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11489","display_name":"Air Traffic Management and Optimization","score":0.22169999778270721,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.02800000086426735,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8646000027656555},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.7669000029563904},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7477999925613403},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.59170001745224},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5612999796867371},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.45570001006126404},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.44350001215934753},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4027999937534332}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8646000027656555},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7944999933242798},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.7669000029563904},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7477999925613403},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.59170001745224},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5612999796867371},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.553600013256073},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.45570001006126404},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.44350001215934753},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4027999937534332},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.36880001425743103},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36640000343322754},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3564999997615814},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.33880001306533813},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.3098999857902527},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.30079999566078186},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2840000092983246},{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.2777999937534332},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2535000145435333}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1016/j.asoc.2026.115145","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.asoc.2026.115145","pdf_url":null,"source":{"id":"https://openalex.org/S140556538","display_name":"Applied Soft Computing","issn_l":"1568-4946","issn":["1568-4946","1872-9681"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Soft Computing","raw_type":"journal-article"},{"id":"pmh:oai:psasir.upm.edu.my:125195","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196260","display_name":"Universiti Putra Malaysia Institutional Repository (Universiti Putra Malaysia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130343225","host_organization_name":"Universiti Putra Malaysia","host_organization_lineage":["https://openalex.org/I130343225"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":{"id":"doi:10.1016/j.asoc.2026.115145","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.asoc.2026.115145","pdf_url":null,"source":{"id":"https://openalex.org/S140556538","display_name":"Applied Soft Computing","issn_l":"1568-4946","issn":["1568-4946","1872-9681"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Soft Computing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320338279","display_name":"Air Force Office of Scientific Research","ror":"https://ror.org/011e9bt93"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W2067246174","https://openalex.org/W2124497430","https://openalex.org/W2623202212","https://openalex.org/W3006868075","https://openalex.org/W3035633917","https://openalex.org/W3047375952","https://openalex.org/W3123270512","https://openalex.org/W3153187775","https://openalex.org/W3169726339","https://openalex.org/W3198247306","https://openalex.org/W3215041652","https://openalex.org/W4283808151","https://openalex.org/W4313485422","https://openalex.org/W4318217967","https://openalex.org/W4321608219","https://openalex.org/W4321792508","https://openalex.org/W4322495590","https://openalex.org/W4365563312","https://openalex.org/W4366606012","https://openalex.org/W4383740955","https://openalex.org/W4385345048","https://openalex.org/W4386157387","https://openalex.org/W4388543717","https://openalex.org/W4391741219","https://openalex.org/W4393140099","https://openalex.org/W4393304821","https://openalex.org/W4395678331","https://openalex.org/W4396712697","https://openalex.org/W4401748410","https://openalex.org/W4401835755","https://openalex.org/W4402217167","https://openalex.org/W4404599563","https://openalex.org/W4408100269","https://openalex.org/W4408791788","https://openalex.org/W4411336769","https://openalex.org/W4415218736","https://openalex.org/W7116659924"],"related_works":[],"abstract_inverted_index":{"The":[0,16,162],"rapid":[1],"expansion":[2],"of":[3,19,39,50,259],"uncrewed":[4],"aerial":[5],"vehicles":[6],"(UAVs)":[7],"across":[8,21],"industries":[9],"has":[10,26],"led":[11],"to":[12,66,87,94,193,247],"increased":[13],"airspace":[14],"congestion.":[15],"increasing":[17,257],"use":[18],"drones":[20,93],"many":[22,60],"fields":[23],"and":[24,46,99,139,148,159,199,267],"locations":[25],"caused":[27],"serious":[28],"problems,":[29],"especially":[30],"in":[31,74,102,127,177,219,236],"avoiding":[32],"collisions.":[33],"In":[34],"the":[35,48,155,169,174,184,207,210,264],"rapidly":[36],"developing":[37],"field":[38],"drone":[40,132],"technology,":[41],"ensuring":[42],"UAV":[43,51,233,249,260],"flight":[44],"safety":[45],"reducing":[47],"risk":[49],"collisions":[52],"have":[53],"therefore":[54],"become":[55],"urgent":[56],"concerns.":[57],"There":[58],"are":[59],"artificial":[61],"intelligence":[62,98],"(AI)":[63],"algorithms":[64],"designed":[65],"solve":[67,88],"this":[68],"problem,":[69],"but":[70],"most":[71],"work":[72,109],"only":[73],"situations":[75],"with":[76,96,256],"a":[77,84,111,128],"single":[78],"agent.":[79],"Multi-agent":[80],"reinforcement":[81],"learning":[82,138,141,151],"is":[83,165],"promising":[85],"way":[86],"these":[89],"problems.":[90],"It":[91],"enables":[92],"operate":[95],"greater":[97],"flexibility,":[100],"even":[101],"challenging":[103],"situations,":[104],"alongside":[105],"other":[106],"agents.":[107],"This":[108,153],"presents":[110],"Multi-Agent":[112,227],"Deep":[113,228],"Reinforcement":[114,229],"Learning":[115,230],"Algorithm":[116,231],"based":[117,262],"on":[118,263],"an":[119,225,241],"efficient":[120,242],"graph":[121,243],"attention":[122,244],"network":[123,245],"for":[124,232],"collision":[125,234],"avoidance":[126,235],"dense,":[129],"complex":[130],"multi-agent":[131],"environment.":[133],"We":[134],"propose":[135],"both":[136],"curriculum":[137,268],"transfer":[140],"by":[142,168],"adding":[143],"more":[144,157,160],"agents":[145,261],"over":[146],"time":[147,197],"subsequently":[149],"employing":[150],"models.":[152],"makes":[154],"system":[156],"scalable":[158],"coordinated.":[161],"training":[163],"process":[164],"significantly":[166],"advanced":[167],"suggested":[170,265],"method,":[171],"which":[172],"outperforms":[173],"current":[175],"benchmark":[176],"continuous":[178],"settings.":[179,222],"Our":[180],"findings":[181],"indicate":[182],"that":[183],"proposed":[185,211],"approach":[186],"achieves":[187],"17%":[188],"higher":[189],"cumulative":[190],"reward,":[191],"up":[192],"10%":[194],"fewer":[195,202],"loss-of-separation":[196],"steps,":[198],"about":[200],"44%":[201],"active":[203],"interaction":[204],"edges":[205],"than":[206],"benchmark.":[208],"Furthermore,":[209],"method":[212],"reduces":[213],"action-selection":[214],"bias,":[215],"improving":[216],"decision-making":[217],"stability":[218],"dense":[220],"multi-UAV":[221],"\u2022":[223,239,252],"Suggest":[224],"Efficient":[226],"dynamic":[237],"environments.":[238],"Propose":[240],"architecture":[246,266],"model":[248],"interactions":[250],"efficiently.":[251],"Demonstrate":[253],"improved":[254],"scalability":[255],"numbers":[258],"learning.":[269]},"counts_by_year":[],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2026-03-31T00:00:00"}
