{"id":"https://openalex.org/W7147103577","doi":"https://doi.org/10.1109/icvisp68610.2025.11451239","title":"Attention-SBA YOLOv11: UAV Small Object Detection with Attention and Boundary Aggregation","display_name":"Attention-SBA YOLOv11: UAV Small Object Detection with Attention and Boundary Aggregation","publication_year":2025,"publication_date":"2025-11-28","ids":{"openalex":"https://openalex.org/W7147103577","doi":"https://doi.org/10.1109/icvisp68610.2025.11451239"},"language":null,"primary_location":{"id":"doi:10.1109/icvisp68610.2025.11451239","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451239","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080051025","display_name":"Z. Jane Wang","orcid":"https://orcid.org/0009-0006-6717-4357"},"institutions":[{"id":"https://openalex.org/I25355098","display_name":"Chang'an University","ror":"https://ror.org/05mxya461","country_code":"CN","type":"education","lineage":["https://openalex.org/I25355098"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zilong Wang","raw_affiliation_strings":["Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I25355098"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074051673","display_name":"Z. Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I25355098","display_name":"Chang'an University","ror":"https://ror.org/05mxya461","country_code":"CN","type":"education","lineage":["https://openalex.org/I25355098"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zixiang Liu","raw_affiliation_strings":["Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I25355098"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106732380","display_name":"Xinyao Liu","orcid":"https://orcid.org/0009-0005-8645-8702"},"institutions":[{"id":"https://openalex.org/I25355098","display_name":"Chang'an University","ror":"https://ror.org/05mxya461","country_code":"CN","type":"education","lineage":["https://openalex.org/I25355098"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyao Liu","raw_affiliation_strings":["Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I25355098"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051615382","display_name":"Y. Han","orcid":"https://orcid.org/0000-0002-3510-6505"},"institutions":[{"id":"https://openalex.org/I25355098","display_name":"Chang'an University","ror":"https://ror.org/05mxya461","country_code":"CN","type":"education","lineage":["https://openalex.org/I25355098"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingying Han","raw_affiliation_strings":["Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I25355098"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132686872","display_name":"Ting Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I25355098","display_name":"Chang'an University","ror":"https://ror.org/05mxya461","country_code":"CN","type":"education","lineage":["https://openalex.org/I25355098"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Chen","raw_affiliation_strings":["Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I25355098"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5132609592","display_name":"Tao Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I25355098","display_name":"Chang'an University","ror":"https://ror.org/05mxya461","country_code":"CN","type":"education","lineage":["https://openalex.org/I25355098"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Gao","raw_affiliation_strings":["Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Chang&#x2019;an University,School of Information Engineering,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I25355098"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5080051025"],"corresponding_institution_ids":["https://openalex.org/I25355098"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.74871269,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9527999758720398,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9527999758720398,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.00559999980032444,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.004399999976158142,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7639999985694885},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6506999731063843},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6406999826431274},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.6000000238418579},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.5400000214576721},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5310999751091003},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5063999891281128},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5059999823570251},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5004000067710876}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7639999985694885},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7178999781608582},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6506999731063843},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6407999992370605},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6406999826431274},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.6000000238418579},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5587000250816345},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.5400000214576721},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5310999751091003},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5063999891281128},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5059999823570251},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5004000067710876},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4918000102043152},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.45820000767707825},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4544000029563904},{"id":"https://openalex.org/C193536780","wikidata":"https://www.wikidata.org/wiki/Q1513153","display_name":"Edge detection","level":4,"score":0.446399986743927},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4242999851703644},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.4203000068664551},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.37880000472068787},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.3643999993801117},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.31949999928474426},{"id":"https://openalex.org/C87360688","wikidata":"https://www.wikidata.org/wiki/Q740686","display_name":"Synthetic aperture radar","level":2,"score":0.31630000472068787},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26350000500679016},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.2605000138282776},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2526000142097473}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icvisp68610.2025.11451239","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451239","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7890669107437134}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W2193145675","https://openalex.org/W2963351448","https://openalex.org/W2964241181","https://openalex.org/W4214507171","https://openalex.org/W4391974567","https://openalex.org/W4396738701","https://openalex.org/W4401856303","https://openalex.org/W4401887491","https://openalex.org/W4402754006","https://openalex.org/W4404501926","https://openalex.org/W4404696402","https://openalex.org/W4415795831"],"related_works":[],"abstract_inverted_index":{"In":[0],"UAV":[1,140],"aerial":[2],"imagery,":[3],"small":[4],"objects,":[5],"dense":[6],"target":[7,105],"distributions,":[8],"and":[9,23,30,62,98,107,137],"complex":[10],"backgrounds":[11],"significantly":[12],"constrain":[13],"performance":[14],"of":[15,135],"object":[16],"detection":[17],"models,":[18],"particularly":[19],"regarding":[20],"feature":[21,32,77],"extraction":[22],"localization":[24],"accuracy.":[25],"To":[26,79],"mitigate":[27],"boundary":[28,52,67],"ambiguity":[29],"inadequate":[31],"representation":[33],"in":[34,139],"YOLOv11":[35,117],"for":[36],"UAV-based":[37],"small-object":[38,141],"detection,":[39],"this":[40],"study":[41],"introduces":[42],"a":[43,82],"Structural":[44],"Boundary":[45],"Aggregation":[46],"(SBA)":[47],"module.":[48],"SBA":[49,136],"integrates":[50],"shallow":[51],"features":[53],"with":[54],"deep":[55],"semantic":[56],"information":[57],"to":[58,91,125],"enhance":[59],"edge":[60],"sensitivity":[61],"improve":[63],"boundary-region":[64],"representation.":[65],"However,":[66],"enhancement":[68],"alone":[69],"cannot":[70],"fully":[71],"suppress":[72],"background":[73],"interference":[74],"or":[75],"alleviate":[76],"redundancy.":[78],"address":[80],"this,":[81],"Channel":[83],"Prior":[84],"Convolutional":[85],"Attention":[86],"(CPCA)":[87],"module":[88],"is":[89],"incorporated":[90],"adaptively":[92],"assign":[93],"dynamic":[94],"weights":[95],"across":[96],"channel":[97],"spatial":[99],"dimensions,":[100],"enabling":[101],"focus":[102],"on":[103,112],"critical":[104],"areas":[106],"strengthening":[108],"discriminative":[109],"capability.":[110],"Experiments":[111],"VISDRONE2019-DET":[113],"demonstrate":[114],"that":[115],"Attention-SBA":[116],"improves":[118],"mean":[119],"Average":[120],"Precision":[121],"(mAP)":[122],"from":[123],"0.44":[124],"0.455":[126],"while":[127],"maintaining":[128],"high":[129],"inference":[130],"speed,":[131],"validating":[132],"complementary":[133],"benefits":[134],"CPCA":[138],"detection.":[142]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-04-02T00:00:00"}
