{"id":"https://openalex.org/W4416251787","doi":"https://doi.org/10.1109/ijcnn64981.2025.11227609","title":"YOLO-Wide: A Complex Background Small Object Detection Network for Wide-Field High-Resolution Cameras","display_name":"YOLO-Wide: A Complex Background Small Object Detection Network for Wide-Field High-Resolution Cameras","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4416251787","doi":"https://doi.org/10.1109/ijcnn64981.2025.11227609"},"language":null,"primary_location":{"id":"doi:10.1109/ijcnn64981.2025.11227609","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11227609","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100373745","display_name":"Xiaohong Chen","orcid":"https://orcid.org/0000-0002-9797-8384"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaomin Chen","raw_affiliation_strings":["Sun Yat-Sen University,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-Sen University,Shenzhen,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100333738","display_name":"Yue Zhang","orcid":"https://orcid.org/0000-0002-6327-5023"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Zhang","raw_affiliation_strings":["Sun Yat-Sen University,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-Sen University,Shenzhen,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101406275","display_name":"Zengping Chen","orcid":"https://orcid.org/0000-0002-2892-8252"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zengping Chen","raw_affiliation_strings":["Sun Yat-Sen University,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-Sen University,Shenzhen,China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100373745"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37516949,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8910999894142151,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8910999894142151,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.018400000408291817,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.009600000455975533,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7419999837875366},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.6847000122070312},{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.6786999702453613},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5781999826431274},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5414999723434448},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.49300000071525574},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.4733000099658966},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.46880000829696655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7681000232696533},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7419999837875366},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7031999826431274},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6930999755859375},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.6847000122070312},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.6786999702453613},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5781999826431274},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5414999723434448},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.49300000071525574},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.4733000099658966},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.4449999928474426},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.44279998540878296},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.40610000491142273},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.32839998602867126},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.32600000500679016},{"id":"https://openalex.org/C126422989","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature detection (computer vision)","level":4,"score":0.3248000144958496},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.2782999873161316},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn64981.2025.11227609","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11227609","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2752782242","https://openalex.org/W2962749812","https://openalex.org/W2963351448","https://openalex.org/W2963566548","https://openalex.org/W2963857746","https://openalex.org/W2989604896","https://openalex.org/W2990763144","https://openalex.org/W3012573144","https://openalex.org/W3022917557","https://openalex.org/W3034552520","https://openalex.org/W3034959114","https://openalex.org/W3035396860","https://openalex.org/W3042916480","https://openalex.org/W3111218342","https://openalex.org/W3205100603","https://openalex.org/W3210586215","https://openalex.org/W4214507171","https://openalex.org/W4289752563","https://openalex.org/W4382568144","https://openalex.org/W4390873058","https://openalex.org/W4394596865","https://openalex.org/W4403770406","https://openalex.org/W4415795831"],"related_works":[],"abstract_inverted_index":{"Wide-field":[0,49],"high-resolution":[1,50],"cameras":[2],"are":[3,173],"advanced":[4],"imaging":[5],"devices":[6],"with":[7],"a":[8,112,199],"wide":[9],"field":[10],"of":[11,43,79,105,158,190],"view":[12],"and":[13,31,39,129],"high":[14],"resolution.":[15],"However,":[16],"in":[17,73,135,151],"practical":[18],"applications,":[19],"they":[20],"encounter":[21],"several":[22],"challenges,":[23],"such":[24],"as":[25],"small":[26,45,80,168],"object":[27,29],"scale,":[28],"occlusion,":[30],"complex":[32,106],"background":[33],"interference.":[34],"To":[35],"address":[36],"these":[37],"issues":[38],"enable":[40],"effective":[41],"detection":[42,77,109,161],"distant":[44],"ground":[46],"targets":[47],"by":[48,144],"cameras,":[51],"this":[52],"paper":[53],"proposes":[54],"the":[55,62,69,76,83,92,98,103,124,132,136,139,148,156,159,176,185,193,203],"YOLO-Wide":[56,186],"method":[57],"based":[58,116],"on":[59,97,108,117,175,192],"YOLOv11n.":[60,205],"First,":[61],"Dysample":[63],"module":[64,72,115],"is":[65,89,120,142,163,198],"introduced":[66,121],"to":[67,94,122,165],"replace":[68],"traditional":[70],"upsampling":[71],"YOLOv11n,":[74],"enhancing":[75],"capability":[78,128],"objects.":[81],"Secondly,":[82],"Deformable":[84],"Dual":[85],"Attention":[86],"Module":[87],"(DDAM)":[88],"proposed,":[90],"enabling":[91],"model":[93],"better":[95],"focus":[96],"target":[99],"region,":[100],"effectively":[101],"suppressing":[102],"interference":[104],"backgrounds":[107],"results.":[110],"Third,":[111],"residual":[113],"connection":[114],"ODConv":[118],"(ODConv-ResBlock)":[119],"improve":[123],"model\u2019s":[125,149],"feature":[126,179],"extraction":[127],"fully":[130],"explore":[131],"semantic":[133],"information":[134],"image.":[137],"Fourth,":[138],"loss":[140],"function":[141],"optimized":[143],"using":[145],"FocalerCIoU,":[146],"improving":[147],"accuracy":[150],"bounding":[152],"box":[153],"localization.":[154],"Finally,":[155],"position":[157],"network":[160],"head":[162],"adjusted":[164],"ensure":[166],"that":[167,184],"objects":[169],"at":[170],"different":[171],"scales":[172],"processed":[174],"most":[177],"suitable":[178],"maps.":[180],"Experimental":[181],"results":[182],"show":[183],"achieves":[187],"an":[188],"mAP@0.5":[189],"89.4%":[191],"custom":[194],"dataset,":[195],"Small-Ground,":[196],"which":[197],"9.1%":[200],"improvement":[201],"over":[202],"baseline":[204]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-14T00:00:00"}
