{"id":"https://openalex.org/W4386838484","doi":"https://doi.org/10.3390/rs15184580","title":"SMFF-YOLO: A Scale-Adaptive YOLO Algorithm with Multi-Level Feature Fusion for Object Detection in UAV Scenes","display_name":"SMFF-YOLO: A Scale-Adaptive YOLO Algorithm with Multi-Level Feature Fusion for Object Detection in UAV Scenes","publication_year":2023,"publication_date":"2023-09-17","ids":{"openalex":"https://openalex.org/W4386838484","doi":"https://doi.org/10.3390/rs15184580"},"language":"en","primary_location":{"id":"doi:10.3390/rs15184580","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs15184580","pdf_url":"https://www.mdpi.com/2072-4292/15/18/4580/pdf?version=1695008836","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2072-4292/15/18/4580/pdf?version=1695008836","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030863313","display_name":"Yuming Wang","orcid":"https://orcid.org/0000-0002-1602-6868"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210119942","display_name":"Wuhan Textile University","ror":"https://ror.org/02jgsf398","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210119942"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuming Wang","raw_affiliation_strings":["School of Computer Science, Wuhan University, Wuhan 430072, China","School of Electronic and Electrical Engineering, Wuhan Textile University, Wuhan 430077, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Wuhan University, Wuhan 430072, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Electronic and Electrical Engineering, Wuhan Textile University, Wuhan 430077, China","institution_ids":["https://openalex.org/I4210119942"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043300518","display_name":"Hua Zou","orcid":"https://orcid.org/0000-0002-3641-2686"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hua Zou","raw_affiliation_strings":["School of Computer Science, Wuhan University, Wuhan 430072, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Wuhan University, Wuhan 430072, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029969492","display_name":"Ming Yin","orcid":"https://orcid.org/0000-0002-6785-1649"},"institutions":[{"id":"https://openalex.org/I4210119942","display_name":"Wuhan Textile University","ror":"https://ror.org/02jgsf398","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210119942"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Yin","raw_affiliation_strings":["School of Electronic and Electrical Engineering, Wuhan Textile University, Wuhan 430077, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Electrical Engineering, Wuhan Textile University, Wuhan 430077, China","institution_ids":["https://openalex.org/I4210119942"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101508701","display_name":"Xining Zhang","orcid":"https://orcid.org/0000-0002-9426-6453"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xining Zhang","raw_affiliation_strings":["School of Computer Science, Wuhan University, Wuhan 430072, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Wuhan University, Wuhan 430072, China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5043300518"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":{"value":2500,"currency":"CHF","value_usd":2707},"apc_paid":{"value":2500,"currency":"CHF","value_usd":2707},"fwci":6.5415,"has_fulltext":true,"cited_by_count":53,"citation_normalized_percentile":{"value":0.9775491,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"15","issue":"18","first_page":"4580","last_page":"4580"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7907942533493042},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7198123335838318},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6268583536148071},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5920282602310181},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5870741009712219},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.5534300804138184},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.5093072652816772},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5037731528282166},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.4999876022338867},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.47620758414268494},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4413226246833801},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37772268056869507},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.23277905583381653},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0728088915348053},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.06607767939567566}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7907942533493042},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7198123335838318},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6268583536148071},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5920282602310181},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5870741009712219},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.5534300804138184},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.5093072652816772},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5037731528282166},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.4999876022338867},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.47620758414268494},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4413226246833801},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37772268056869507},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.23277905583381653},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0728088915348053},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.06607767939567566},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/rs15184580","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs15184580","pdf_url":"https://www.mdpi.com/2072-4292/15/18/4580/pdf?version=1695008836","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b7dc26eaef584136bfc341b23816d031","is_oa":true,"landing_page_url":"https://doaj.org/article/b7dc26eaef584136bfc341b23816d031","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing, Vol 15, Iss 18, p 4580 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/rs15184580","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs15184580","pdf_url":"https://www.mdpi.com/2072-4292/15/18/4580/pdf?version=1695008836","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.6399999856948853,"display_name":"Sustainable cities and communities"}],"awards":[{"id":"https://openalex.org/G2506566822","display_name":null,"funder_award_id":"U1903214","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4386838484.pdf"},"referenced_works_count":56,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2037227137","https://openalex.org/W2102605133","https://openalex.org/W2109255472","https://openalex.org/W2163605009","https://openalex.org/W2193145675","https://openalex.org/W2565639579","https://openalex.org/W2608264083","https://openalex.org/W2613718673","https://openalex.org/W2797090510","https://openalex.org/W2884585870","https://openalex.org/W2929738993","https://openalex.org/W2936599103","https://openalex.org/W2941472577","https://openalex.org/W2962777203","https://openalex.org/W2962850098","https://openalex.org/W2963037989","https://openalex.org/W2963150697","https://openalex.org/W2963351448","https://openalex.org/W2963857746","https://openalex.org/W2964241181","https://openalex.org/W2964309882","https://openalex.org/W2972006294","https://openalex.org/W2972877657","https://openalex.org/W2995199175","https://openalex.org/W2997747012","https://openalex.org/W3012573144","https://openalex.org/W3034552520","https://openalex.org/W3034971973","https://openalex.org/W3036271496","https://openalex.org/W3088979451","https://openalex.org/W3096609285","https://openalex.org/W3106250896","https://openalex.org/W3116963012","https://openalex.org/W3122173535","https://openalex.org/W3138516171","https://openalex.org/W3175630421","https://openalex.org/W3176346992","https://openalex.org/W3198011468","https://openalex.org/W3205100603","https://openalex.org/W3208019692","https://openalex.org/W3208285567","https://openalex.org/W3210586215","https://openalex.org/W3211328899","https://openalex.org/W4206294875","https://openalex.org/W4220859115","https://openalex.org/W4226410580","https://openalex.org/W4281719556","https://openalex.org/W4297549407","https://openalex.org/W4328125637","https://openalex.org/W4386075524","https://openalex.org/W4386076079","https://openalex.org/W4386076325","https://openalex.org/W6761306150","https://openalex.org/W6770715449","https://openalex.org/W6810626455"],"related_works":["https://openalex.org/W3094187672","https://openalex.org/W3211653591","https://openalex.org/W2766547489","https://openalex.org/W3197089899","https://openalex.org/W2756241593","https://openalex.org/W2894878591","https://openalex.org/W3015973434","https://openalex.org/W3034296931","https://openalex.org/W4386099271","https://openalex.org/W2937816158"],"abstract_inverted_index":{"Object":[0],"detection":[1,65,76,94,196],"in":[2,13,114],"images":[3],"captured":[4],"by":[5,117],"unmanned":[6],"aerial":[7],"vehicles":[8],"(UAVs)":[9],"holds":[10],"great":[11],"potential":[12],"various":[14],"domains,":[15],"including":[16],"civilian":[17],"applications,":[18],"urban":[19],"planning,":[20],"and":[21,37,89,140,185,204,220],"disaster":[22],"response.":[23],"However,":[24],"it":[25],"faces":[26],"several":[27],"challenges,":[28],"such":[29],"as":[30],"multi-scale":[31,119],"variations,":[32],"dense":[33],"scenes,":[34],"complex":[35,123],"backgrounds,":[36,124],"tiny-sized":[38],"objects.":[39,98],"In":[40],"this":[41],"paper,":[42],"we":[43,125,149],"present":[44],"a":[45,57,170],"novel":[46],"scale-adaptive":[47],"YOLO":[48],"framework":[49,71,169],"called":[50],"SMFF-YOLO,":[51],"which":[52,135,166],"addresses":[53],"these":[54],"challenges":[55],"through":[56],"multi-level":[58],"feature":[59,103,138],"fusion":[60,104,139],"approach.":[61,224],"To":[62,121],"improve":[63],"the":[64,73,93,100,109,127,142,151,159,168,178,183,218],"accuracy":[66,95],"of":[67,96,111,145,161,180,222],"small":[68],"objects,":[69],"our":[70,192,223],"incorporates":[72],"ELAN-SW":[74],"object":[75,115],"prediction":[77],"head.":[78],"This":[79],"newly":[80],"designed":[81],"head":[82],"effectively":[83],"utilizes":[84],"both":[85],"global":[86],"contextual":[87],"information":[88],"local":[90],"features,":[91],"enhancing":[92],"tiny":[97],"Additionally,":[99],"proposed":[101],"bidirectional":[102],"pyramid":[105,131],"(BFFP)":[106],"module":[107],"tackles":[108],"issue":[110],"scale":[112],"variations":[113],"sizes":[116],"aggregating":[118],"features.":[120],"handle":[122],"introduce":[126],"adaptive":[128,137],"atrous":[129],"spatial":[130],"pooling":[132],"(AASPP)":[133],"module,":[134],"enables":[136],"alleviates":[141],"negative":[143],"impact":[144],"cluttered":[146],"scenes.":[147],"Moreover,":[148],"adopt":[150],"Wise-IoU(WIoU)":[152],"bounding":[153],"box":[154],"regression":[155],"loss":[156],"to":[157],"enhance":[158],"competitiveness":[160],"different":[162],"quality":[163],"anchor":[164],"boxes,":[165],"offers":[167],"more":[171],"informed":[172],"gradient":[173],"allocation":[174],"strategy.":[175],"We":[176],"validate":[177],"effectiveness":[179],"SMFF-YOLO":[181],"using":[182],"VisDrone":[184,203],"UAVDT":[186,207],"datasets.":[187,208],"Experimental":[188],"results":[189],"demonstrate":[190],"that":[191],"model":[193],"achieves":[194],"higher":[195],"accuracy,":[197],"with":[198,212],"AP50":[199],"reaching":[200],"54.3%":[201],"for":[202,206],"42.4%":[205],"Visual":[209],"comparative":[210],"experiments":[211],"other":[213],"YOLO-based":[214],"methods":[215],"further":[216],"illustrate":[217],"robustness":[219],"adaptability":[221]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":30},{"year":2024,"cited_by_count":17},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
