{"id":"https://openalex.org/W4408145129","doi":"https://doi.org/10.1109/access.2025.3547825","title":"Autonomous Aerial Vehicle Object Detection Based on Spatial Perception and Multiscale Semantic and Detail Feature Fusion","display_name":"Autonomous Aerial Vehicle Object Detection Based on Spatial Perception and Multiscale Semantic and Detail Feature Fusion","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4408145129","doi":"https://doi.org/10.1109/access.2025.3547825"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3547825","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3547825","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3547825","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013535253","display_name":"Wei Rao","orcid":"https://orcid.org/0000-0002-5738-0759"},"institutions":[{"id":"https://openalex.org/I141103825","display_name":"Jiangxi University of Water Resources and Electric Power","ror":"https://ror.org/00avfj807","country_code":"CN","type":"education","lineage":["https://openalex.org/I141103825"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Rao","raw_affiliation_strings":["Nanchang Institute of Technology, Nanchang, China"],"raw_orcid":"https://orcid.org/0000-0002-5738-0759","affiliations":[{"raw_affiliation_string":"Nanchang Institute of Technology, Nanchang, China","institution_ids":["https://openalex.org/I141103825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100429227","display_name":"Siyuan Chen","orcid":"https://orcid.org/0000-0001-9100-9809"},"institutions":[{"id":"https://openalex.org/I141103825","display_name":"Jiangxi University of Water Resources and Electric Power","ror":"https://ror.org/00avfj807","country_code":"CN","type":"education","lineage":["https://openalex.org/I141103825"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyuan Chen","raw_affiliation_strings":["Nanchang Institute of Technology, Nanchang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nanchang Institute of Technology, Nanchang, China","institution_ids":["https://openalex.org/I141103825"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100380731","display_name":"Dan Li","orcid":"https://orcid.org/0000-0002-4759-565X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dan Li","raw_affiliation_strings":["Key Laboratory for Information Science of Electromagnetic Waves, Research Center of Smart Networks and Systems, School of Information Science and Technology, Fudan University, Shanghai, China","School of Information Science and Technology, Key Laboratory for Information Science of Electromagnetic Waves and the Research Center of Smart Networks and Systems, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4759-565X","affiliations":[{"raw_affiliation_string":"Key Laboratory for Information Science of Electromagnetic Waves, Research Center of Smart Networks and Systems, School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Information Science and Technology, Key Laboratory for Information Science of Electromagnetic Waves and the Research Center of Smart Networks and Systems, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":3.907,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91597987,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"13","issue":null,"first_page":"42897","last_page":"42909"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14257","display_name":"Advanced Measurement and Detection Methods","score":0.9818000197410583,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9538999795913696,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7720739841461182},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7107622623443604},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6537719964981079},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5979864597320557},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5905733108520508},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.5333789587020874},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5311504602432251},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.499298095703125},{"id":"https://openalex.org/keywords/aerial-image","display_name":"Aerial image","score":0.4677693247795105},{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.44764986634254456},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4410487115383148},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4350340664386749},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.42858651280403137},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.09581339359283447}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7720739841461182},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7107622623443604},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6537719964981079},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5979864597320557},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5905733108520508},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.5333789587020874},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5311504602432251},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.499298095703125},{"id":"https://openalex.org/C2776429412","wikidata":"https://www.wikidata.org/wiki/Q4688011","display_name":"Aerial image","level":3,"score":0.4677693247795105},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.44764986634254456},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4410487115383148},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4350340664386749},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.42858651280403137},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.09581339359283447},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3547825","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3547825","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:744a57b674ae454ab6c12dcd8763350d","is_oa":true,"landing_page_url":"https://doaj.org/article/744a57b674ae454ab6c12dcd8763350d","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 42897-42909 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3547825","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3547825","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6971886382","display_name":"\u57fa\u4e8e\u5f20\u91cf\u5206\u89e3\u7684\u9ad8\u9636\u5747\u5300/\u975e\u5747\u5300\u9635\u5217\u4fe1\u53f7\u5904\u7406\u7814\u7a76","funder_award_id":"61961025","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8625978647","display_name":null,"funder_award_id":"20202BABL202001","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1536680647","https://openalex.org/W2102605133","https://openalex.org/W2144506857","https://openalex.org/W2151103935","https://openalex.org/W2161969291","https://openalex.org/W2570343428","https://openalex.org/W2962766617","https://openalex.org/W2963037989","https://openalex.org/W2963857746","https://openalex.org/W2964121718","https://openalex.org/W3009824020","https://openalex.org/W3018757597","https://openalex.org/W3034971973","https://openalex.org/W3134054343","https://openalex.org/W3159196909","https://openalex.org/W3171660447","https://openalex.org/W3205100603","https://openalex.org/W3205741456","https://openalex.org/W3210997334","https://openalex.org/W4224940354","https://openalex.org/W4226345051","https://openalex.org/W4239510810","https://openalex.org/W4248437541","https://openalex.org/W4296569553","https://openalex.org/W4306916543","https://openalex.org/W4311001968","https://openalex.org/W4318953537","https://openalex.org/W4320002812","https://openalex.org/W4382519713","https://openalex.org/W4385480830","https://openalex.org/W4385839827","https://openalex.org/W4387757656","https://openalex.org/W4388052496","https://openalex.org/W4400762160","https://openalex.org/W6620707391","https://openalex.org/W6676769703","https://openalex.org/W6750227808","https://openalex.org/W6849520326","https://openalex.org/W6858317486","https://openalex.org/W6947681574"],"related_works":["https://openalex.org/W2132659060","https://openalex.org/W2031992971","https://openalex.org/W3214791684","https://openalex.org/W4396860960","https://openalex.org/W2152662039","https://openalex.org/W4390482660","https://openalex.org/W2972256598","https://openalex.org/W2610408157","https://openalex.org/W4388813151","https://openalex.org/W2612465689"],"abstract_inverted_index":{"Owing":[0],"to":[1,32,72,95,164],"changes":[2],"in":[3,113],"the":[4,44,63,66,74,83,88,92,97,104,114,138,166,172,181,185,192,204,225],"spatial":[5,84],"position":[6],"of":[7,51,77,87,91,100,116,184,196,211,222,240],"Autonomous":[8],"Aerial":[9],"Vehicle":[10],"(AAV)":[11],"aerial":[12,21,53],"images":[13,54],"and":[14,28,40,102,131,141,170,174,194,200,213,224,232,235],"limited":[15],"platform":[16],"resources,":[17],"most":[18],"existing":[19],"AAV":[20,52],"image":[22],"detection":[23,38,49,75,89,98,176,182],"models":[24],"have":[25],"low":[26],"accuracy,":[27],"it":[29],"is":[30,60,70,118,162,208],"difficult":[31],"achieve":[33],"a":[34,107,122,132,146],"good":[35],"balance":[36],"between":[37],"performance":[39,99],"lightweight.":[41],"To":[42],"solve":[43],"above":[45],"problems,":[46],"an":[47,209],"object":[48],"model":[50,65,105],"based":[55,136],"on":[56,137,203],"YOLOv8s,":[57,218,241],"called":[58,129,160],"BSDS-YOLOv8s,":[59],"proposed.":[61],"In":[62],"proposed":[64,163],"Dynamic":[67],"Head":[68],"(DyHead)":[69],"used":[71],"replace":[73],"head":[76,90],"YOLOv8s":[78,117],"firstly,":[79],"which":[80,120],"can":[81],"improve":[82,96],"perception":[85],"ability":[86],"model.":[93,186],"Second,":[94],"DyHead":[101],"make":[103],"lightweight,":[106],"new":[108],"feature":[109,133],"pyramid":[110],"network":[111],"(SDI-MBiFPN)":[112],"Neck":[115],"proposed,":[119],"contains":[121],"Multiscale":[123],"Bidirectional":[124],"Feature":[125],"Pyramid":[126],"Network":[127],"(BiFPN),":[128],"MBiFPN,":[130],"fusion":[134],"method":[135,147],"redesigned":[139],"Semantic":[140],"Detail":[142],"Fusion":[143],"(SDI).":[144],"Finally,":[145],"that":[148,191],"integrates":[149],"Soft":[150],"Non-Maximum":[151],"Suppression":[152],"(Soft-NMS)":[153],"with":[154],"Generalized":[155],"Intersection":[156],"over":[157,217],"Union":[158],"(GIoU),":[159],"GIoU-Soft-NMS,":[161],"enhance":[165],"model\u2019s":[167],"post-processing":[168],"capability":[169],"reduce":[171],"missed":[173],"false":[175],"rates,":[177],"thereby":[178],"further":[179],"improving":[180],"accuracy":[183],"The":[187,220],"experimental":[188],"results":[189],"showed":[190],"mAP0.5":[193],"mAP0.5:0.95":[195],"BSDS-YOLOv8s":[197],"reached":[198],"49.6%":[199],"34.1%,":[201],"respectively,":[202],"VisDrone2019":[205],"dataset.":[206],"This":[207],"improvement":[210],"9.2":[212],"9.8":[214],"percentage":[215],"points":[216],"respectively.":[219,242],"number":[221],"parameters":[223],"floating":[226],"point":[227],"operations":[228],"(FLOPs)":[229],"were":[230],"8.03M":[231],"26.6G,":[233],"27.8%":[234],"7.6%":[236],"less":[237],"than":[238],"those":[239]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-03-05T00:00:00"}
