{"id":"https://openalex.org/W4402982680","doi":"https://doi.org/10.1109/icme57554.2024.10688108","title":"DSENet: An Object-Wise Density-Informed Coarse-to-Fine Object Detector for Aerial Image","display_name":"DSENet: An Object-Wise Density-Informed Coarse-to-Fine Object Detector for Aerial Image","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4402982680","doi":"https://doi.org/10.1109/icme57554.2024.10688108"},"language":"en","primary_location":{"id":"doi:10.1109/icme57554.2024.10688108","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icme57554.2024.10688108","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101694703","display_name":"Haoran Jiang","orcid":"https://orcid.org/0009-0006-9575-3575"},"institutions":[{"id":"https://openalex.org/I113940042","display_name":"Shanghai University","ror":"https://ror.org/006teas31","country_code":"CN","type":"education","lineage":["https://openalex.org/I113940042"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haoran Jiang","raw_affiliation_strings":["Shanghai University"],"affiliations":[{"raw_affiliation_string":"Shanghai University","institution_ids":["https://openalex.org/I113940042"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082986746","display_name":"Xiangjie Wang","orcid":"https://orcid.org/0009-0003-1241-5801"},"institutions":[{"id":"https://openalex.org/I113940042","display_name":"Shanghai University","ror":"https://ror.org/006teas31","country_code":"CN","type":"education","lineage":["https://openalex.org/I113940042"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangjie Wang","raw_affiliation_strings":["Shanghai University"],"affiliations":[{"raw_affiliation_string":"Shanghai University","institution_ids":["https://openalex.org/I113940042"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100343044","display_name":"Junjie Zhang","orcid":"https://orcid.org/0000-0002-0033-0494"},"institutions":[{"id":"https://openalex.org/I113940042","display_name":"Shanghai University","ror":"https://ror.org/006teas31","country_code":"CN","type":"education","lineage":["https://openalex.org/I113940042"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junjie Zhang","raw_affiliation_strings":["Shanghai University"],"affiliations":[{"raw_affiliation_string":"Shanghai University","institution_ids":["https://openalex.org/I113940042"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100409994","display_name":"Jian Zhang","orcid":"https://orcid.org/0000-0002-7240-3541"},"institutions":[{"id":"https://openalex.org/I113940042","display_name":"Shanghai University","ror":"https://ror.org/006teas31","country_code":"CN","type":"education","lineage":["https://openalex.org/I113940042"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Zhang","raw_affiliation_strings":["Shanghai University"],"affiliations":[{"raw_affiliation_string":"Shanghai University","institution_ids":["https://openalex.org/I113940042"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100456047","display_name":"Dan Zeng","orcid":"https://orcid.org/0000-0002-9036-7791"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Dan Zeng","raw_affiliation_strings":["University of Technology Sydney"],"affiliations":[{"raw_affiliation_string":"University of Technology Sydney","institution_ids":["https://openalex.org/I114017466"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101694703"],"corresponding_institution_ids":["https://openalex.org/I113940042"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16876518,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7062467932701111},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6695319414138794},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6577836275100708},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.6355182528495789},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6304293870925903},{"id":"https://openalex.org/keywords/aerial-image","display_name":"Aerial image","score":0.5929016470909119},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.525851309299469},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3942285180091858},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.33735617995262146},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.1803094446659088},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.11666443943977356}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7062467932701111},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6695319414138794},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6577836275100708},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.6355182528495789},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6304293870925903},{"id":"https://openalex.org/C2776429412","wikidata":"https://www.wikidata.org/wiki/Q4688011","display_name":"Aerial image","level":3,"score":0.5929016470909119},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.525851309299469},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3942285180091858},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.33735617995262146},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.1803094446659088},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.11666443943977356},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme57554.2024.10688108","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icme57554.2024.10688108","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","display_name":"Climate action","score":0.5699999928474426}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2463631526","https://openalex.org/W2586716774","https://openalex.org/W2962749812","https://openalex.org/W2963351448","https://openalex.org/W2963849369","https://openalex.org/W2989611864","https://openalex.org/W2996735448","https://openalex.org/W3036271496","https://openalex.org/W3116963012","https://openalex.org/W3118837087","https://openalex.org/W3170033848","https://openalex.org/W3208285567","https://openalex.org/W4312823573","https://openalex.org/W4313050697","https://openalex.org/W4385801363","https://openalex.org/W4386072246","https://openalex.org/W4390873076","https://openalex.org/W6750759024"],"related_works":["https://openalex.org/W4396860960","https://openalex.org/W4292830139","https://openalex.org/W4319309705","https://openalex.org/W2972256598","https://openalex.org/W4388813151","https://openalex.org/W2610408157","https://openalex.org/W2612465689","https://openalex.org/W4284972948","https://openalex.org/W4237245474","https://openalex.org/W2099047584"],"abstract_inverted_index":{"Object":[0],"detection":[1,53,97],"in":[2],"aerial":[3,143],"images":[4],"remains":[5],"formidable":[6],"due":[7],"to":[8],"substantial":[9],"object":[10,15,84],"scale":[11],"variations,":[12],"and":[13,40,52,86,105,126,147],"uneven":[14],"distributions.":[16],"Previous":[17],"methods":[18],"widely":[19],"adopt":[20],"the":[21,76,110,116],"coarse-to-fine":[22],"methodology":[23],"where":[24,127],"detectors":[25],"focus":[26],"on":[27,102,140],"large-scale":[28],"objects":[29],"coarsely.":[30],"Sub-regions":[31],"that":[32,81,135],"contain":[33],"densely":[34],"distributed":[35],"small":[36],"ones":[37],"are":[38,99,130],"captured":[39],"detected":[41],"finely.":[42],"However,":[43],"two":[44,141],"pivotal":[45],"assessment":[46],"factors":[47],"of":[48,115],"sub-regions,":[49],"positional":[50],"precision,":[51],"difficulty,":[54],"deserve":[55],"further":[56],"consideration.":[57],"In":[58],"this":[59],"paper,":[60],"we":[61],"propose":[62],"an":[63],"object-wise":[64,78],"density-informed":[65],"DSENet":[66,136],"including":[67],"consecutive":[68],"stages":[69],"termed":[70],"\"Discernment,":[71],"Selection,":[72],"Elevation":[73],"\".":[74],"Specifically,":[75],"sophisticated":[77],"density":[79,103],"map":[80],"considers":[82],"both":[83],"scales":[85],"angles,":[87],"helps":[88],"discern":[89],"more":[90],"positional-precise":[91],"sub-regions.":[92],"Then":[93],"sub-regions":[94,122],"with":[95,120],"high":[96],"difficulty":[98],"selected":[100,121],"based":[101],"intensities":[104],"coarse":[106,128],"detections":[107,129],"collaboratively.":[108],"Finally,":[109],"fine":[111],"detector":[112],"head":[113],"instead":[114],"full":[117],"detector,":[118],"fine-tuned":[119],"efficiently,":[123],"elevates":[124],"what":[125],"mediocre.":[131],"Extensive":[132],"experiments":[133],"show":[134],"achieves":[137],"state-of-the-art":[138],"performance":[139],"popular":[142],"image":[144],"datasets,":[145],"VisDrone":[146],"DOTA-V1.5.":[148]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
