{"id":"https://openalex.org/W4417438566","doi":"https://doi.org/10.1109/mwc.2025.3630121","title":"Multimodal Large Language Models-Enabled UAV Swarm: Towards Efficient and Intelligent Autonomous Aerial Systems","display_name":"Multimodal Large Language Models-Enabled UAV Swarm: Towards Efficient and Intelligent Autonomous Aerial Systems","publication_year":2025,"publication_date":"2025-12-17","ids":{"openalex":"https://openalex.org/W4417438566","doi":"https://doi.org/10.1109/mwc.2025.3630121"},"language":null,"primary_location":{"id":"doi:10.1109/mwc.2025.3630121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mwc.2025.3630121","pdf_url":null,"source":{"id":"https://openalex.org/S146764194","display_name":"IEEE Wireless Communications","issn_l":"1536-1284","issn":["1536-1284","1558-0687"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Wireless Communications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102683343","display_name":"Yuqi Ping","orcid":"https://orcid.org/0009-0001-0795-1066"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuqi Ping","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001968310","display_name":"Tianhao Liang","orcid":"https://orcid.org/0000-0003-3628-364X"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianhao Liang","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114173595","display_name":"Huahao Ding","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huahao Ding","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108955653","display_name":"Guangyu Lei","orcid":"https://orcid.org/0009-0000-7628-2778"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangyu Lei","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005014456","display_name":"Junwei Wu","orcid":"https://orcid.org/0000-0002-7346-5082"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junwei Wu","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100975073","display_name":"Xuan Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xuan Zou","raw_affiliation_strings":["Key Laboratory of Forest and Grassland Fire Risk Prevention, Ministry of Emergency Management, China Fire and Rescue Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Forest and Grassland Fire Risk Prevention, Ministry of Emergency Management, China Fire and Rescue Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087704283","display_name":"Kuan Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuan Shi","raw_affiliation_strings":["Key Laboratory of Forest and Grassland Fire Risk Prevention, Ministry of Emergency Management, China Fire and Rescue Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Forest and Grassland Fire Risk Prevention, Ministry of Emergency Management, China Fire and Rescue Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037878863","display_name":"Rui Shao","orcid":"https://orcid.org/0000-0003-0090-9604"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Shao","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029086169","display_name":"Chiya Zhang","orcid":"https://orcid.org/0000-0002-1113-4659"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chiya Zhang","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101519463","display_name":"Weizheng Zhang","orcid":"https://orcid.org/0000-0002-3915-8361"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weizheng Zhang","raw_affiliation_strings":["College of Informatics, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011236120","display_name":"Weijie Yuan","orcid":"https://orcid.org/0000-0002-2158-0046"},"institutions":[{"id":"https://openalex.org/I165488957","display_name":"Lingnan University","ror":"https://ror.org/0563pg902","country_code":"HK","type":"education","lineage":["https://openalex.org/I165488957"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Weijie Yuan","raw_affiliation_strings":["School of Interdisciplinary Studies, Lingnan University, SAR, Hong Kong","School of Interdisciplinary Studies, Lingnan University, Hong Kong SAR"],"affiliations":[{"raw_affiliation_string":"School of Interdisciplinary Studies, Lingnan University, SAR, Hong Kong","institution_ids":["https://openalex.org/I165488957"]},{"raw_affiliation_string":"School of Interdisciplinary Studies, Lingnan University, Hong Kong SAR","institution_ids":["https://openalex.org/I165488957"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100329653","display_name":"Tingting Zhang","orcid":"https://orcid.org/0000-0003-2585-0290"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingting Zhang","raw_affiliation_strings":["College of Informatics and the Guangdong Provincial Key Laboratory of Space-Aerial Networking and Intelligent Sensing, Harbin Institute of Technology, Shenzhen, China","College of Informatics and the Guangdong Provincial Key Laboratory of Space-Aerial Networking and Intelligent Sensing, Harbin Institute of Technology, Shenzhen 518000, China, and also with the Peng Cheng Laboratory, Shenzhen, P. R. China"],"affiliations":[{"raw_affiliation_string":"College of Informatics and the Guangdong Provincial Key Laboratory of Space-Aerial Networking and Intelligent Sensing, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"College of Informatics and the Guangdong Provincial Key Laboratory of Space-Aerial Networking and Intelligent Sensing, Harbin Institute of Technology, Shenzhen 518000, China, and also with the Peng Cheng Laboratory, Shenzhen, P. R. China","institution_ids":["https://openalex.org/I4210136793"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5102683343"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":3.8352,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.94357588,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"33","issue":"1","first_page":"89","last_page":"97"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.5782999992370605,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.5782999992370605,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.062199998646974564,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12597","display_name":"Fire Detection and Safety Systems","score":0.06199999898672104,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.7573000192642212},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.6740000247955322},{"id":"https://openalex.org/keywords/situation-awareness","display_name":"Situation awareness","score":0.5958999991416931},{"id":"https://openalex.org/keywords/swarm-behaviour","display_name":"Swarm behaviour","score":0.4702000021934509},{"id":"https://openalex.org/keywords/firefighting","display_name":"Firefighting","score":0.4625000059604645},{"id":"https://openalex.org/keywords/swarm-intelligence","display_name":"Swarm intelligence","score":0.33899998664855957}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.82669997215271},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.7573000192642212},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.6740000247955322},{"id":"https://openalex.org/C145804949","wikidata":"https://www.wikidata.org/wiki/Q478123","display_name":"Situation awareness","level":2,"score":0.5958999991416931},{"id":"https://openalex.org/C181335050","wikidata":"https://www.wikidata.org/wiki/Q14915018","display_name":"Swarm behaviour","level":2,"score":0.4702000021934509},{"id":"https://openalex.org/C557531904","wikidata":"https://www.wikidata.org/wiki/Q897825","display_name":"Firefighting","level":2,"score":0.4625000059604645},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.45489999651908875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44269999861717224},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.36250001192092896},{"id":"https://openalex.org/C119487961","wikidata":"https://www.wikidata.org/wiki/Q863960","display_name":"Swarm intelligence","level":3,"score":0.33899998664855957},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.33090001344680786},{"id":"https://openalex.org/C56397880","wikidata":"https://www.wikidata.org/wiki/Q6044094","display_name":"Intelligent decision support system","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C145424490","wikidata":"https://www.wikidata.org/wiki/Q618465","display_name":"Remotely operated underwater vehicle","level":4,"score":0.2734000086784363},{"id":"https://openalex.org/C169337768","wikidata":"https://www.wikidata.org/wiki/Q2446723","display_name":"Swarm robotics","level":3,"score":0.2694999873638153},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.26030001044273376}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mwc.2025.3630121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mwc.2025.3630121","pdf_url":null,"source":{"id":"https://openalex.org/S146764194","display_name":"IEEE Wireless Communications","issn_l":"1536-1284","issn":["1536-1284","1558-0687"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Wireless Communications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W4384158407","https://openalex.org/W4393405282","https://openalex.org/W4394730983","https://openalex.org/W4402727764","https://openalex.org/W4404103156","https://openalex.org/W4404356490","https://openalex.org/W4406207083","https://openalex.org/W4409311614","https://openalex.org/W4410628584","https://openalex.org/W4410852594","https://openalex.org/W4413917076","https://openalex.org/W4414155281"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"breakthroughs":[1],"in":[2,34],"multimodal":[3],"large":[4],"language":[5],"models":[6],"(MLLMs)":[7],"have":[8],"endowed":[9],"AI":[10],"systems":[11],"with":[12,54],"unified":[13],"perception,":[14],"reasoning,":[15],"and":[16,22,43,60,72,76,90,115,123],"natural-language":[17],"interaction":[18],"across":[19,62],"text,":[20],"image,":[21],"video":[23,133],"modalities.":[24],"Meanwhile,":[25],"unmanned":[26],"aerial":[27],"vehicle":[28],"(UAV)":[29],"swarms":[30,56],"are":[31],"increasingly":[32],"deployed":[33],"dynamic,":[35],"safety-critical":[36],"missions":[37],"that":[38,111],"demand":[39],"rapid":[40],"situational":[41],"awareness":[42],"autonomous":[44],"adaptation.":[45],"This":[46],"paper":[47],"explores":[48],"potential":[49],"solutions":[50],"for":[51,84,127],"integrating":[52],"MLLMs":[53],"UAV":[55,87,129],"to":[57],"enhance":[58],"intelligence":[59],"adaptability":[61],"diverse":[63],"tasks.":[64],"Specifically,":[65],"we":[66,79,97,119],"first":[67],"outline":[68],"the":[69,92,99,102,121,135],"fundamental":[70],"architectures":[71],"functions":[73],"of":[74,101,134],"UAVs":[75],"MLLMs.":[77],"Then,":[78],"present":[80],"a":[81,106],"comprehensive":[82],"framework":[83,104],"an":[85],"MLLM-enabled":[86,128],"swarm":[88],"system":[89],"discuss":[91,120],"opportunities":[93],"it":[94],"offers.":[95],"Next,":[96],"demonstrate":[98],"capabilities":[100],"proposed":[103],"through":[105],"forest":[107],"firefighting":[108],"case":[109],"study":[110],"includes":[112],"both":[113],"simulation":[114],"real-world":[116],"experiments.":[117],"Finally,":[118],"challenges":[122],"future":[124],"research":[125],"directions":[126],"swarms.":[130],"An":[131],"illustrative":[132],"experiments":[136],"is":[137],"available":[138],"at":[139],"<uri":[140],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[141],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://youtu.be/zwnB9ZSa5A4</uri>.":[142]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-17T00:00:00"}
