{"id":"https://openalex.org/W4353004817","doi":"https://doi.org/10.1109/tcsvt.2023.3260115","title":"MedoidsFormer: A Strong 3D Object Detection Backbone by Exploiting Interaction With Adjacent Medoid Tokens","display_name":"MedoidsFormer: A Strong 3D Object Detection Backbone by Exploiting Interaction With Adjacent Medoid Tokens","publication_year":2023,"publication_date":"2023-03-21","ids":{"openalex":"https://openalex.org/W4353004817","doi":"https://doi.org/10.1109/tcsvt.2023.3260115"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3260115","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3260115","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015080274","display_name":"Xiao Yu Tian","orcid":"https://orcid.org/0000-0003-3472-9898"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaoyu Tian","raw_affiliation_strings":["School of Software, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103140342","display_name":"Ming Yang","orcid":"https://orcid.org/0000-0002-4277-7702"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Yang","raw_affiliation_strings":["School of Software, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101600341","display_name":"Qian Yu","orcid":"https://orcid.org/0000-0002-0538-7940"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qian Yu","raw_affiliation_strings":["School of Software, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080894318","display_name":"Jun\u2010Hai Yong","orcid":"https://orcid.org/0000-0002-4326-4167"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junhai Yong","raw_affiliation_strings":["School of Software, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082181536","display_name":"Dong Xu","orcid":"https://orcid.org/0000-0003-2775-9730"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Dong Xu","raw_affiliation_strings":["Department of Computer Science, The University of Hong Kong, Pokfulam, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, The University of Hong Kong, Pokfulam, Hong Kong","institution_ids":["https://openalex.org/I889458895"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5015080274"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.8423,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.87312948,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"33","issue":"10","first_page":"5844","last_page":"5854"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8390892744064331},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.645090639591217},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6099550724029541},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5838965177536011},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5349377989768982},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5341184735298157},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4455392062664032},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.44373011589050293},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4322059154510498},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4226856827735901},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.343313992023468},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34291893243789673}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8390892744064331},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.645090639591217},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6099550724029541},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5838965177536011},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5349377989768982},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5341184735298157},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4455392062664032},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.44373011589050293},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4322059154510498},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4226856827735901},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.343313992023468},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34291893243789673},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3260115","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3260115","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7400000095367432}],"awards":[{"id":"https://openalex.org/G4692674620","display_name":null,"funder_award_id":"62002012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322170","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":88,"referenced_works":["https://openalex.org/W2083620785","https://openalex.org/W2115579991","https://openalex.org/W2560609797","https://openalex.org/W2896457183","https://openalex.org/W2897529137","https://openalex.org/W2949708697","https://openalex.org/W2963120444","https://openalex.org/W2963121255","https://openalex.org/W2963727135","https://openalex.org/W2964062501","https://openalex.org/W2968296999","https://openalex.org/W2970597249","https://openalex.org/W2981949127","https://openalex.org/W3031752193","https://openalex.org/W3034314779","https://openalex.org/W3034681945","https://openalex.org/W3035172746","https://openalex.org/W3035346742","https://openalex.org/W3036853234","https://openalex.org/W3094502228","https://openalex.org/W3096609285","https://openalex.org/W3107212734","https://openalex.org/W3118341329","https://openalex.org/W3131500599","https://openalex.org/W3136022415","https://openalex.org/W3137278571","https://openalex.org/W3138516171","https://openalex.org/W3156811085","https://openalex.org/W3160179442","https://openalex.org/W3164543136","https://openalex.org/W3166089996","https://openalex.org/W3166470370","https://openalex.org/W3166712493","https://openalex.org/W3167095230","https://openalex.org/W3167539120","https://openalex.org/W3167732492","https://openalex.org/W3171087525","https://openalex.org/W3171125843","https://openalex.org/W3171377125","https://openalex.org/W3175544090","https://openalex.org/W3175563878","https://openalex.org/W3176153963","https://openalex.org/W3188046901","https://openalex.org/W3188283811","https://openalex.org/W3190216403","https://openalex.org/W3201719054","https://openalex.org/W3203949114","https://openalex.org/W3206826736","https://openalex.org/W3206836360","https://openalex.org/W3212645988","https://openalex.org/W3214586131","https://openalex.org/W3217340782","https://openalex.org/W4200632008","https://openalex.org/W4214490042","https://openalex.org/W4214493665","https://openalex.org/W4214755140","https://openalex.org/W4214777292","https://openalex.org/W4214893857","https://openalex.org/W4225531230","https://openalex.org/W4226391640","https://openalex.org/W4226396383","https://openalex.org/W4285186657","https://openalex.org/W4285197287","https://openalex.org/W4287204411","https://openalex.org/W4293704629","https://openalex.org/W4310078553","https://openalex.org/W4312307873","https://openalex.org/W4313007769","https://openalex.org/W4313149358","https://openalex.org/W4385245566","https://openalex.org/W6739778489","https://openalex.org/W6739901393","https://openalex.org/W6755207826","https://openalex.org/W6763701032","https://openalex.org/W6769571200","https://openalex.org/W6778485988","https://openalex.org/W6779564934","https://openalex.org/W6784333009","https://openalex.org/W6787846440","https://openalex.org/W6789760779","https://openalex.org/W6794906783","https://openalex.org/W6796931752","https://openalex.org/W6797360341","https://openalex.org/W6797790494","https://openalex.org/W6798016242","https://openalex.org/W6800092589","https://openalex.org/W6805849596","https://openalex.org/W6840571137"],"related_works":["https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W1482209366","https://openalex.org/W2110523656","https://openalex.org/W2521627374","https://openalex.org/W2981954115","https://openalex.org/W2901057123"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,53,89],"propose":[4],"MedoidsFormer,":[5],"a":[6,12,55,91],"novel":[7],"transformer-based":[8],"backbone":[9],"equipped":[10],"with":[11],"self-attention":[13,57,145],"mechanism":[14,58,146],"that":[15],"is":[16,37,43],"tailored":[17],"explicitly":[18],"to":[19,33,100,138],"LiDAR-based":[20],"3D":[21,47,116],"object":[22,26,48,117],"detection.":[23,49],"Unlike":[24],"2D":[25],"detection,":[27],"the":[28,34,127,140,143],"proportion":[29],"of":[30,83,142],"target":[31],"objects":[32],"input":[35],"scene":[36],"much":[38],"smaller,":[39],"and":[40,74,122,147],"their":[41],"distribution":[42],"significantly":[44],"sparser":[45],"in":[46],"Given":[50],"these":[51],"observations,":[52],"introduce":[54],"new":[56,144],"called":[59],"Medoids":[60],"Attention,":[61],"focusing":[62],"on":[63,126],"exploiting":[64],"interactions":[65],"within":[66],"surrounding":[67],"regions,":[68],"which":[69],"not":[70],"only":[71],"reduces":[72],"computation":[73],"memory":[75],"costs":[76],"but":[77],"obtains":[78],"discriminative":[79],"context":[80],"information.":[81],"Instead":[82],"aggregating":[84],"tokens":[85,104],"from":[86],"adjacent":[87],"areas,":[88],"present":[90],"dynamic":[92],"semantic-aware":[93],"token":[94],"mining":[95],"process":[96],"through":[97,119],"k-Medoids":[98],"clustering":[99],"direct":[101],"select":[102],"representative":[103],"for":[105],"attention":[106],"modeling.":[107],"Our":[108],"proposed":[109],"method":[110],"shows":[111],"consistent":[112],"improvement":[113],"over":[114],"existing":[115],"detectors":[118],"extensive":[120],"experiments":[121],"achieves":[123],"state-of-the-art":[124],"performance":[125],"large-scale":[128],"Waymo":[129],"Open":[130],"Dataset.":[131],"We":[132],"also":[133],"conduct":[134],"comprehensive":[135],"ablation":[136],"studies":[137],"verify":[139],"efficacy":[141],"provide":[148],"thorough":[149],"insights.":[150]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
