{"id":"https://openalex.org/W4388283616","doi":"https://doi.org/10.1109/tmm.2023.3330103","title":"Bounding Box Vectorization for Oriented Object Detection With Tanimoto Coefficient Regression","display_name":"Bounding Box Vectorization for Oriented Object Detection With Tanimoto Coefficient Regression","publication_year":2023,"publication_date":"2023-11-03","ids":{"openalex":"https://openalex.org/W4388283616","doi":"https://doi.org/10.1109/tmm.2023.3330103"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2023.3330103","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3330103","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102709426","display_name":"Linfei Wang","orcid":"https://orcid.org/0000-0003-1917-9031"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Linfei Wang","raw_affiliation_strings":["FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, China","FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, Yunnan, China","Yunnan United Vision Innovations Technology Co., Ltd, Kunming, P. R. China"],"affiliations":[{"raw_affiliation_string":"FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, China","institution_ids":["https://openalex.org/I189210763"]},{"raw_affiliation_string":"FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, Yunnan, China","institution_ids":["https://openalex.org/I189210763"]},{"raw_affiliation_string":"Yunnan United Vision Innovations Technology Co., Ltd, Kunming, P. R. China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074672983","display_name":"Yibing Zhan","orcid":"https://orcid.org/0000-0003-3180-0484"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibing Zhan","raw_affiliation_strings":["JD Explore Academy, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD Explore Academy, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431792","display_name":"Wei Liu","orcid":"https://orcid.org/0000-0002-3865-8145"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["Tencent AI Lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085309099","display_name":"Baosheng Yu","orcid":"https://orcid.org/0000-0002-0761-7893"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Baosheng Yu","raw_affiliation_strings":["University of Sydney, Camperdown, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of Sydney, Camperdown, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067600725","display_name":"Dapeng Tao","orcid":"https://orcid.org/0000-0003-0783-5273"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dapeng Tao","raw_affiliation_strings":["FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, China","FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, Yunnan, China","Yunnan Key Laboratory of Media Convergence, China"],"affiliations":[{"raw_affiliation_string":"FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, China","institution_ids":["https://openalex.org/I189210763"]},{"raw_affiliation_string":"FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, Yunnan, China","institution_ids":["https://openalex.org/I189210763"]},{"raw_affiliation_string":"Yunnan Key Laboratory of Media Convergence, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102709426"],"corresponding_institution_ids":["https://openalex.org/I189210763"],"apc_list":null,"apc_paid":null,"fwci":2.773,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.92426085,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"26","issue":null,"first_page":"5181","last_page":"5193"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.9156680107116699},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7565980553627014},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.7117160558700562},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.6431353688240051},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.5974085927009583},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.537205696105957},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.5330853462219238},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5101916790008545},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.5022537708282471},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4889332354068756},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.47387954592704773},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4515940845012665},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4288116693496704},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.41121363639831543},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21292227506637573},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.14155921339988708},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.11535456776618958}],"concepts":[{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.9156680107116699},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7565980553627014},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.7117160558700562},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.6431353688240051},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.5974085927009583},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.537205696105957},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.5330853462219238},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5101916790008545},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.5022537708282471},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4889332354068756},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.47387954592704773},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4515940845012665},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4288116693496704},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.41121363639831543},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21292227506637573},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.14155921339988708},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11535456776618958},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2023.3330103","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3330103","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6000861853","display_name":null,"funder_award_id":"62172354","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W1536680647","https://openalex.org/W1963917497","https://openalex.org/W2150066425","https://openalex.org/W2160114756","https://openalex.org/W2504335775","https://openalex.org/W2594177559","https://openalex.org/W2725486421","https://openalex.org/W2772143815","https://openalex.org/W2801995602","https://openalex.org/W2962749812","https://openalex.org/W2963351448","https://openalex.org/W2964979676","https://openalex.org/W2967487473","https://openalex.org/W2968296999","https://openalex.org/W2982770724","https://openalex.org/W2991363140","https://openalex.org/W2997624179","https://openalex.org/W3022917557","https://openalex.org/W3034993937","https://openalex.org/W3047669229","https://openalex.org/W3082900443","https://openalex.org/W3097779785","https://openalex.org/W3099598395","https://openalex.org/W3100234280","https://openalex.org/W3136761610","https://openalex.org/W3157386596","https://openalex.org/W3170033848","https://openalex.org/W3173367141","https://openalex.org/W3174389852","https://openalex.org/W3174873843","https://openalex.org/W3177105943","https://openalex.org/W3186269967","https://openalex.org/W3189348500","https://openalex.org/W3200733355","https://openalex.org/W3211980987","https://openalex.org/W4207055281","https://openalex.org/W4211114389","https://openalex.org/W4211247672","https://openalex.org/W4214648418","https://openalex.org/W4225590475","https://openalex.org/W4288325606","https://openalex.org/W4290715466","https://openalex.org/W4293679656","https://openalex.org/W4304084055","https://openalex.org/W4312804579","https://openalex.org/W4312961412","https://openalex.org/W4313153210","https://openalex.org/W4385573252","https://openalex.org/W4386065355","https://openalex.org/W6739844568","https://openalex.org/W6764322716","https://openalex.org/W6766533318","https://openalex.org/W6788031712","https://openalex.org/W6788870397","https://openalex.org/W6811378280"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"Current":[0],"oriented":[1,44,115,188],"object":[2,45,95,157,189],"detection":[3,190],"methods":[4,208],"mainly":[5],"utilize":[6],"a":[7,78,97,136,211],"vanilla":[8],"coordinate-angle":[9],"representation":[10],"for":[11],"bounding":[12,22,83,116,132],"box":[13,23,84,117,133],"regression,":[14],"which":[15],"usually":[16],"suffers":[17],"from":[18],"inconsistency":[19,111],"between":[20],"the":[21,42,73,89,105,110,123,128,131,145,150,159,178,199,204],"regression":[24,80],"losses":[25],"and":[26,38,91,138,141,195],"prediction":[27],"errors":[28],"induced":[29],"with":[30,82,96],"respect":[31],"to":[32,126,144,155,166],"different":[33],"rotation":[34],"angles,":[35],"aspect":[36],"ratios,":[37],"scales.":[39],"Therefore,":[40],"although":[41],"existing":[43],"detectors":[46],"have":[47],"achieved":[48],"very":[49],"good":[50],"performances":[51],"under":[52],"coarse":[53],"evaluation":[54,66,214],"metrics":[55],"such":[56,68,172],"as":[57,69,149,173],"AP50,":[58],"their":[59],"performance":[60],"significantly":[61,202],"degrades":[62],"when":[63,209],"using":[64,210],"stricter":[65],"metric":[67],"AP75.":[70],"To":[71],"address":[72],"abovementioned":[74],"issues,":[75],"we":[76,121,142],"propose":[77],"new":[79],"method":[81,107,161,180,201],"vectorization":[85],"that":[86],"implicitly":[87],"represents":[88],"shape":[90],"orientation":[92,170],"of":[93,99,130],"an":[94],"set":[98],"orthogonal":[100],"vectors.":[101],"By":[102],"doing":[103],"this,":[104],"proposed":[106,146,160,179,200],"delicately":[108],"avoids":[109],"issues":[112],"encountered":[113],"in":[114,135],"regression.":[118],"During":[119],"training,":[120],"introduce":[122],"Tanimoto":[124],"coefficient":[125],"evaluate":[127,177],"similarity":[129],"vector":[134],"shape-":[137],"orientation-aware":[139],"manner,":[140],"refer":[143],"box-to-vector":[147],"loss":[148],"B2V":[151],"loss.":[152],"In":[153],"addition":[154],"2D":[156,194],"detection,":[158],"can":[162],"be":[163],"easily":[164],"generalized":[165],"3D":[167,196],"scenarios":[168],"involving":[169],"estimation,":[171],"autonomous":[174],"driving.":[175],"We":[176],"through":[181],"extensive":[182],"experiments":[183],"conducted":[184],"on":[185],"four":[186],"popular":[187],"datasets,":[191,197],"including":[192],"both":[193],"where":[198],"outperforms":[203],"recently":[205],"developed":[206],"state-of-the-art":[207],"more":[212],"accurate":[213],"metric.":[215]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":16},{"year":2024,"cited_by_count":6}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
