{"id":"https://openalex.org/W4412446203","doi":"https://doi.org/10.1109/dsp65409.2025.11075181","title":"Expand to Detect: Enlarging Bounding Box Annotations for Small Object Detection","display_name":"Expand to Detect: Enlarging Bounding Box Annotations for Small Object Detection","publication_year":2025,"publication_date":"2025-06-25","ids":{"openalex":"https://openalex.org/W4412446203","doi":"https://doi.org/10.1109/dsp65409.2025.11075181"},"language":"en","primary_location":{"id":"doi:10.1109/dsp65409.2025.11075181","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsp65409.2025.11075181","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 25th International Conference on Digital Signal Processing (DSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002132225","display_name":"Mustafa U\u011fur","orcid":"https://orcid.org/0000-0003-3472-2311"},"institutions":[{"id":"https://openalex.org/I48912391","display_name":"Istanbul Technical University","ror":"https://ror.org/059636586","country_code":"TR","type":"education","lineage":["https://openalex.org/I48912391"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Mustafa U\u011fur","raw_affiliation_strings":["Istanbul Technical University,Department of Computer Engineering,Istanbul,T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Istanbul Technical University,Department of Computer Engineering,Istanbul,T&#x00FC;rkiye","institution_ids":["https://openalex.org/I48912391"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009982931","display_name":"Haz\u0131m Kemal Ekenel","orcid":"https://orcid.org/0000-0003-3697-8548"},"institutions":[{"id":"https://openalex.org/I48912391","display_name":"Istanbul Technical University","ror":"https://ror.org/059636586","country_code":"TR","type":"education","lineage":["https://openalex.org/I48912391"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Hazim Kemal Ekenel","raw_affiliation_strings":["Istanbul Technical University,Department of Computer Engineering,Istanbul,T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Istanbul Technical University,Department of Computer Engineering,Istanbul,T&#x00FC;rkiye","institution_ids":["https://openalex.org/I48912391"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5002132225"],"corresponding_institution_ids":["https://openalex.org/I48912391"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19526404,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.8212969303131104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7577773928642273},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.6555100679397583},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6027694344520569},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5338296294212341},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4620043933391571},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4143785238265991},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3507540225982666},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.23224538564682007},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.10676053166389465}],"concepts":[{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.8212969303131104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7577773928642273},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.6555100679397583},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6027694344520569},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5338296294212341},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4620043933391571},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4143785238265991},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3507540225982666},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.23224538564682007},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.10676053166389465}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dsp65409.2025.11075181","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsp65409.2025.11075181","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 25th International Conference on Digital Signal Processing (DSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2579152745","https://openalex.org/W2913012218","https://openalex.org/W2963037989","https://openalex.org/W2992240579","https://openalex.org/W3096609285","https://openalex.org/W3118718721","https://openalex.org/W3119129845","https://openalex.org/W3160733999","https://openalex.org/W3183824707","https://openalex.org/W3210586215","https://openalex.org/W3210997132","https://openalex.org/W4207034821","https://openalex.org/W4225493839","https://openalex.org/W4307411363","https://openalex.org/W4375809357","https://openalex.org/W4385801363","https://openalex.org/W4402754006","https://openalex.org/W6658049321","https://openalex.org/W6804453918","https://openalex.org/W6810913163"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"Detecting":[0],"small":[1,37,96,120],"objects,":[2,38],"those":[3],"with":[4],"<tex":[5],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[6],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$32":[7],"\\times":[8],"32$</tex>":[9],"pixels":[10],"or":[11],"smaller,":[12],"remains":[13],"a":[14],"challenging":[15],"task":[16],"in":[17,88,108],"aerial":[18,124],"imagery":[19],"due":[20],"to":[21,55],"limited":[22],"resolution":[23],"and":[24,43,61,102],"contextual":[25,59,117],"information.":[26],"In":[27],"this":[28,51],"study,":[29],"we":[30,53],"propose":[31],"enlarging":[32],"bounding":[33],"box":[34],"annotations":[35,80],"for":[36,95,119],"thereby":[39],"integrating":[40],"additional":[41],"shape":[42,64],"spatial":[44],"context":[45],"into":[46],"the":[47,58,67,73,112],"training":[48,68],"process.":[49,69],"With":[50],"approach,":[52],"seek":[54],"reinforce":[56],"both":[57],"information":[60,118],"leverage":[62],"object":[63,97,121],"characteristics":[65],"during":[66],"Experiments":[70],"conducted":[71],"on":[72],"VisDrone":[74],"dataset":[75],"demonstrate":[76],"that":[77],"using":[78],"expanded":[79],"yields":[81],"an":[82],"absolute":[83],"improvement":[84],"of":[85,114],"approximately":[86],"10%":[87],"mean":[89],"average":[90,109],"precision.":[91],"Notably,":[92],"detection":[93,122],"accuracy":[94],"classes,":[98],"such":[99],"as":[100],"pedestrians":[101],"motors,":[103],"improves":[104],"by":[105],"over":[106],"20%":[107],"precision,":[110],"highlighting":[111],"benefit":[113],"including":[115],"surrounding":[116],"from":[123],"images.":[125]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
