{"id":"https://openalex.org/W4372260057","doi":"https://doi.org/10.1109/icassp49357.2023.10095995","title":"Pondering About Task Spatial Misalignment: Classification-Localization Equilibrated Object Detection","display_name":"Pondering About Task Spatial Misalignment: Classification-Localization Equilibrated Object Detection","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372260057","doi":"https://doi.org/10.1109/icassp49357.2023.10095995"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10095995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095995","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040898236","display_name":"Yudong Zhang","orcid":"https://orcid.org/0000-0003-4941-0214"},"institutions":[{"id":"https://openalex.org/I4210125878","display_name":"Suzhou Research Institute","ror":"https://ror.org/03ebk0c60","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210125878"]},{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yudong Zhang","raw_affiliation_strings":["USTC,School of Data Science,Hefei,China","School of Data Science, USTC, Hefei, China","Suzhou Institute for Advanced Research, USTC, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"USTC,School of Data Science,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Data Science, USTC, Hefei, China","institution_ids":[]},{"raw_affiliation_string":"Suzhou Institute for Advanced Research, USTC, Suzhou, China","institution_ids":["https://openalex.org/I4210125878"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100770898","display_name":"Wei L\u00fc","orcid":"https://orcid.org/0000-0001-6722-1527"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210125878","display_name":"Suzhou Research Institute","ror":"https://ror.org/03ebk0c60","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210125878"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Lu","raw_affiliation_strings":["USTC,School of Software Engineering,Hefei,China","Suzhou Institute for Advanced Research, USTC, Suzhou, China","School of Software Engineering, USTC, Hefei, China"],"affiliations":[{"raw_affiliation_string":"USTC,School of Software Engineering,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Suzhou Institute for Advanced Research, USTC, Suzhou, China","institution_ids":["https://openalex.org/I4210125878"]},{"raw_affiliation_string":"School of Software Engineering, USTC, Hefei, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100407848","display_name":"Xu Wang","orcid":"https://orcid.org/0000-0002-1492-3477"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210125878","display_name":"Suzhou Research Institute","ror":"https://ror.org/03ebk0c60","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210125878"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Wang","raw_affiliation_strings":["USTC,School of Data Science,Hefei,China","School of Data Science, USTC, Hefei, China","Suzhou Institute for Advanced Research, USTC, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"USTC,School of Data Science,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Data Science, USTC, Hefei, China","institution_ids":[]},{"raw_affiliation_string":"Suzhou Institute for Advanced Research, USTC, Suzhou, China","institution_ids":["https://openalex.org/I4210125878"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103006792","display_name":"Pengkun Wang","orcid":"https://orcid.org/0000-0002-2680-4563"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210125878","display_name":"Suzhou Research Institute","ror":"https://ror.org/03ebk0c60","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210125878"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengkun Wang","raw_affiliation_strings":["USTC,School of Data Science,Hefei,China","Suzhou Institute for Advanced Research, USTC, Suzhou, China","School of Data Science, USTC, Hefei, China"],"affiliations":[{"raw_affiliation_string":"USTC,School of Data Science,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Suzhou Institute for Advanced Research, USTC, Suzhou, China","institution_ids":["https://openalex.org/I4210125878"]},{"raw_affiliation_string":"School of Data Science, USTC, Hefei, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5119268705","display_name":"Yang Wang","orcid":"https://orcid.org/0009-0002-1564-4434"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210125878","display_name":"Suzhou Research Institute","ror":"https://ror.org/03ebk0c60","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210125878"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Wang","raw_affiliation_strings":["University of Science and Technology of China (USTC),Key Laboratory of Precision and Intelligent Chemistry,Hefei,China","School of Data Science, USTC, Hefei, China","Suzhou Institute for Advanced Research, USTC, Suzhou, China","School of Software Engineering, USTC, Hefei, China","Key Laboratory of Precision and Intelligent Chemistry, University of Science and Technology of China (USTC), Hefei, China","School of Computer Science and Technology, USTC, Hefei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China (USTC),Key Laboratory of Precision and Intelligent Chemistry,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Data Science, USTC, Hefei, China","institution_ids":[]},{"raw_affiliation_string":"Suzhou Institute for Advanced Research, USTC, Suzhou, China","institution_ids":["https://openalex.org/I4210125878"]},{"raw_affiliation_string":"School of Software Engineering, USTC, Hefei, China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Precision and Intelligent Chemistry, University of Science and Technology of China (USTC), Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Computer Science and Technology, USTC, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5040898236"],"corresponding_institution_ids":["https://openalex.org/I126520041","https://openalex.org/I4210125878"],"apc_list":null,"apc_paid":null,"fwci":0.2443,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.49892869,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7892974615097046},{"id":"https://openalex.org/keywords/pascal","display_name":"Pascal (unit)","score":0.7115469574928284},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6596888899803162},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6138674020767212},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5648747682571411},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5118152499198914},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.45967844128608704},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4547249376773834},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43198806047439575},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.42812132835388184},{"id":"https://openalex.org/keywords/extractor","display_name":"Extractor","score":0.42799174785614014},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.4238140881061554},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.33435487747192383},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08522859215736389},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.07415536046028137}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7892974615097046},{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.7115469574928284},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6596888899803162},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6138674020767212},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5648747682571411},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5118152499198914},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.45967844128608704},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4547249376773834},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43198806047439575},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.42812132835388184},{"id":"https://openalex.org/C117978034","wikidata":"https://www.wikidata.org/wiki/Q5422192","display_name":"Extractor","level":2,"score":0.42799174785614014},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.4238140881061554},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33435487747192383},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08522859215736389},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.07415536046028137},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C21880701","wikidata":"https://www.wikidata.org/wiki/Q2144042","display_name":"Process engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10095995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095995","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2031489346","https://openalex.org/W2193145675","https://openalex.org/W2194775991","https://openalex.org/W2549139847","https://openalex.org/W2570343428","https://openalex.org/W2884561390","https://openalex.org/W2886335102","https://openalex.org/W2886904239","https://openalex.org/W2950800384","https://openalex.org/W2952122856","https://openalex.org/W2962677013","https://openalex.org/W2962721361","https://openalex.org/W2963037989","https://openalex.org/W2963113370","https://openalex.org/W2963150697","https://openalex.org/W2963474687","https://openalex.org/W2963927307","https://openalex.org/W2964241181","https://openalex.org/W2982770724","https://openalex.org/W2986357608","https://openalex.org/W3034428269","https://openalex.org/W3035473155","https://openalex.org/W3102710196","https://openalex.org/W3106250896","https://openalex.org/W3108849448","https://openalex.org/W4293584584","https://openalex.org/W4297775537"],"related_works":["https://openalex.org/W4376620596","https://openalex.org/W3177249605","https://openalex.org/W2534152068","https://openalex.org/W3138508047","https://openalex.org/W1972515067","https://openalex.org/W1689909837","https://openalex.org/W4293054914","https://openalex.org/W4298525700","https://openalex.org/W2953362004","https://openalex.org/W2549121492"],"abstract_inverted_index":{"Object":[0],"detection":[1],"is":[2],"a":[3,58,75,106,126],"fundamental":[4],"task":[5],"in":[6,57,99],"computer":[7],"vision,":[8],"consisting":[9],"of":[10,34,64,87],"both":[11],"classification":[12,20,35,88],"and":[13,21,36,66,83,89,135],"localization":[14,22,37,90,120],"tasks.":[15,91],"Previous":[16],"works":[17],"mostly":[18],"perform":[19],"with":[23,41,149],"shared":[24],"feature":[25],"extractor":[26],"like":[27],"Convolution":[28],"Neural":[29],"Network.":[30],"However,":[31],"the":[32,44,48,62,85,119],"tasks":[33],"exhibit":[38],"different":[39],"sensitivities":[40],"regard":[42],"to":[43,80,111],"same":[45],"feature,":[46],"hence":[47],"\"task":[49],"spatial":[50],"misalignment\"":[51],"issue.":[52],"This":[53],"issue":[54,60,98],"can":[55,142],"result":[56],"hedge":[59],"between":[61],"performances":[63,86],"localizer":[65],"classifier.":[67],"To":[68,92],"address":[69,94],"these":[70],"issues,":[71],"we":[72,104,116],"first":[73],"propose":[74],"novel":[76],"Dynamic":[77],"Coefficient":[78],"Loss":[79],"simultaneously":[81],"consider":[82],"balance":[84],"well":[93],"anchor":[95],"label":[96],"misjudgment":[97],"irregular-":[100],"shaped":[101],"object":[102],"detection,":[103],"define":[105],"new":[107],"classification-aware":[108],"IoU":[109],"metric":[110],"assign":[112],"anchors":[113],"intelligently.":[114],"Finally,":[115],"further":[117],"introduce":[118],"factor":[121],"into":[122],"NMS":[123],"by":[124,145],"proposing":[125],"Classification-Localization":[127],"balanced":[128],"NMS.":[129],"Extensive":[130],"experiments":[131],"on":[132],"MS":[133],"COCO":[134],"PASCAL":[136],"VOC":[137],"demonstrate":[138],"that":[139],"our":[140],"proposals":[141],"improve":[143],"RetinaNet":[144],"around":[146],"1.5%":[147],"AP":[148],"various":[150],"backbones.":[151]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2025-10-10T00:00:00"}
