{"id":"https://openalex.org/W3194790201","doi":"https://doi.org/10.1109/tcyb.2021.3095305","title":"Enhancing Geometric Factors in Model Learning and Inference for Object Detection and Instance Segmentation","display_name":"Enhancing Geometric Factors in Model Learning and Inference for Object Detection and Instance Segmentation","publication_year":2021,"publication_date":"2021-08-26","ids":{"openalex":"https://openalex.org/W3194790201","doi":"https://doi.org/10.1109/tcyb.2021.3095305","mag":"3194790201","pmid":"https://pubmed.ncbi.nlm.nih.gov/34437079"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2021.3095305","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2021.3095305","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101740169","display_name":"Zhaohui Zheng","orcid":"https://orcid.org/0000-0002-7664-2363"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaohui Zheng","raw_affiliation_strings":["School of Mathematics, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ping Wang","orcid":"https://orcid.org/0000-0001-9339-1829"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Wang","raw_affiliation_strings":["School of Mathematics, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051402211","display_name":"Dongwei Ren","orcid":"https://orcid.org/0000-0002-0965-6810"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongwei Ren","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431792","display_name":"Wei Liu","orcid":"https://orcid.org/0000-0002-3865-8145"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["Tianjin Key Laboratory of Machine Learning, College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Machine Learning, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067337261","display_name":"Rongguang Ye","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rongguang Ye","raw_affiliation_strings":["School of Mathematics, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056686459","display_name":"Qinghua Hu","orcid":"https://orcid.org/0000-0001-7765-8095"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qinghua Hu","raw_affiliation_strings":["Tianjin Key Laboratory of Machine Learning, College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Machine Learning, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100636655","display_name":"Wangmeng Zuo","orcid":"https://orcid.org/0000-0002-3330-783X"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wangmeng Zuo","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101740169"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":81.28,"has_fulltext":false,"cited_by_count":1354,"citation_normalized_percentile":{"value":0.99962843,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"52","issue":"8","first_page":"8574","last_page":"8586"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8238558769226074},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.7639975547790527},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.695636510848999},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6762934327125549},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6656308770179749},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6639694571495056},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6580120325088501},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5793267488479614},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5265945196151733},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.5192280411720276},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5075875520706177},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4902504086494446},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22954586148262024},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.186740905046463},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1266222596168518}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8238558769226074},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.7639975547790527},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.695636510848999},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6762934327125549},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6656308770179749},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6639694571495056},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6580120325088501},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5793267488479614},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5265945196151733},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.5192280411720276},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5075875520706177},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4902504086494446},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22954586148262024},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.186740905046463},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1266222596168518}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2021.3095305","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2021.3095305","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:34437079","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34437079","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1068922776","display_name":null,"funder_award_id":"U19A2073","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5576762974","display_name":null,"funder_award_id":"61801326","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W1932624639","https://openalex.org/W2031489346","https://openalex.org/W2046033161","https://openalex.org/W2058757422","https://openalex.org/W2102605133","https://openalex.org/W2158688659","https://openalex.org/W2168356304","https://openalex.org/W2403089842","https://openalex.org/W2504335775","https://openalex.org/W2570343428","https://openalex.org/W2579985080","https://openalex.org/W2593539516","https://openalex.org/W2725486421","https://openalex.org/W2768909086","https://openalex.org/W2783231089","https://openalex.org/W2798355657","https://openalex.org/W2806070179","https://openalex.org/W2883406652","https://openalex.org/W2884561390","https://openalex.org/W2885605338","https://openalex.org/W2886904239","https://openalex.org/W2888527098","https://openalex.org/W2904746319","https://openalex.org/W2915315630","https://openalex.org/W2916798096","https://openalex.org/W2949708697","https://openalex.org/W2962677013","https://openalex.org/W2962721361","https://openalex.org/W2962766617","https://openalex.org/W2963037989","https://openalex.org/W2963113370","https://openalex.org/W2963402592","https://openalex.org/W2963727135","https://openalex.org/W2963769056","https://openalex.org/W2963998989","https://openalex.org/W2964121718","https://openalex.org/W2964241181","https://openalex.org/W2964294787","https://openalex.org/W2981969038","https://openalex.org/W2982161360","https://openalex.org/W2982770724","https://openalex.org/W2986357608","https://openalex.org/W2993182889","https://openalex.org/W2997747012","https://openalex.org/W3009246422","https://openalex.org/W3034681942","https://openalex.org/W3034826836","https://openalex.org/W3035672751","https://openalex.org/W3106228955","https://openalex.org/W3190261797","https://openalex.org/W4293584584"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"Deep":[0],"learning-based":[1],"object":[2,79,187,217],"detection":[3,80,188],"and":[4,19,29,41,67,81,112,123,141,156,166,173,184,186,193,213,219,222,241],"instance":[5,82,180,226],"segmentation":[6,181],"have":[7,175],"achieved":[8],"unprecedented":[9],"progress.":[10],"In":[11,51,168],"this":[12],"article,":[13],"we":[14,53,127],"propose":[15,128],"complete-IoU":[16],"(CIoU)":[17],"loss":[18,93,107,122,172],"Cluster-NMS":[20,146,174],"for":[21,74,94,216,225],"enhancing":[22],"geometric":[23,56,86,157],"factors":[24,87,158],"in":[25,78,109,115],"both":[26,164],"bounding-box":[27,76],"regression":[28,77,98],"nonmaximum":[30],"suppression":[31],"(NMS),":[32],"leading":[33],"to":[34,117,151,162,178],"notable":[35],"gains":[36,209],"of":[37,48,102],"average":[38,42],"precision":[39],"(AP)":[40],"recall":[43],"(AR),":[44],"without":[45],"the":[46,169,238],"sacrifice":[47],"inference":[49,133],"efficiency.":[50],"particular,":[52],"consider":[54],"three":[55,85],"factors,":[57],"that":[58],"is:":[59],"1)":[60],"overlap":[61],"area;":[62],"2)":[63],"normalized":[64],"central-point":[65],"distance;":[66],"3)":[68],"aspect":[69],"ratio,":[70],"which":[71],"are":[72,88,244],"crucial":[73],"measuring":[75],"segmentation.":[83],"The":[84,100],"then":[89],"incorporated":[90,161],"into":[91],"CIoU":[92,106,171],"better":[95],"distinguishing":[96],"difficult":[97],"cases.":[99],"training":[101],"deep":[103],"models":[104,243],"using":[105],"results":[108],"consistent":[110],"AP":[111,165,212,221],"AR":[113],"improvements":[114],"comparison":[116],"widely":[118],"adopted":[119],"l<sub>n</sub>":[120],"-norm":[121],"IoU-based":[124],"loss.":[125],"Furthermore,":[126],"Cluster-NMS,":[129],"where":[130],"NMS":[131],"during":[132],"is":[134,147],"done":[135],"by":[136],"implicitly":[137],"clustering":[138],"detected":[139],"boxes":[140],"usually":[142],"requires":[143],"fewer":[144],"iterations.":[145],"very":[148],"efficient":[149],"due":[150],"its":[152],"pure":[153],"GPU":[154],"implementation,":[155],"can":[159],"be":[160],"improve":[163],"AR.":[167],"experiments,":[170],"been":[176],"applied":[177],"state-of-the-art":[179],"(e.g.,":[182,189],"YOLACT":[183,198],"BlendMask-RT),":[185],"YOLO":[190],"v3,":[191],"SSD,":[192],"Faster":[194],"R-CNN)":[195],"models.":[196],"Taking":[197],"on":[199,231],"MS":[200],"COCO":[201],"as":[202,210],"an":[203],"example,":[204],"our":[205],"method":[206],"achieves":[207],"performance":[208],"+1.7":[211],"+6.2":[214],"AR<sub>100</sub>":[215,224],"detection,":[218],"+1.1":[220],"+3.5":[223],"segmentation,":[227],"with":[228],"27.1":[229],"FPS":[230],"one":[232],"NVIDIA":[233],"GTX":[234],"1080Ti":[235],"GPU.":[236],"All":[237],"source":[239],"code":[240],"trained":[242],"available":[245],"at":[246],"https://github.com/Zzh-tju/CIoU.":[247]},"counts_by_year":[{"year":2026,"cited_by_count":66},{"year":2025,"cited_by_count":450},{"year":2024,"cited_by_count":468},{"year":2023,"cited_by_count":248},{"year":2022,"cited_by_count":96},{"year":2021,"cited_by_count":25},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
