{"id":"https://openalex.org/W3206826736","doi":"https://doi.org/10.1145/3474085.3475314","title":"From Voxel to Point: IoU-guided 3D Object Detection for Point Cloud with Voxel-to-Point Decoder","display_name":"From Voxel to Point: IoU-guided 3D Object Detection for Point Cloud with Voxel-to-Point Decoder","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3206826736","doi":"https://doi.org/10.1145/3474085.3475314","mag":"3206826736"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475314","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475314","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://eprints.gla.ac.uk/303237/","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108050324","display_name":"Jiale Li","orcid":"https://orcid.org/0000-0002-3299-5386"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiale Li","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080852978","display_name":"Hang Dai","orcid":"https://orcid.org/0000-0002-7609-0124"},"institutions":[{"id":"https://openalex.org/I4210113480","display_name":"Mohamed bin Zayed University of Artificial Intelligence","ror":"https://ror.org/0258gkt32","country_code":"AE","type":"education","lineage":["https://openalex.org/I4210113480"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Hang Dai","raw_affiliation_strings":["Mohamed bin Zayed University of Artificial Intelligence, Abu Dhabi, UAE"],"affiliations":[{"raw_affiliation_string":"Mohamed bin Zayed University of Artificial Intelligence, Abu Dhabi, UAE","institution_ids":["https://openalex.org/I4210113480"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082634513","display_name":"Ling Shao","orcid":"https://orcid.org/0000-0002-8264-6117"},"institutions":[{"id":"https://openalex.org/I4210116052","display_name":"Inception Institute of Artificial Intelligence","ror":"https://ror.org/02664zk40","country_code":"AE","type":"facility","lineage":["https://openalex.org/I4210116052"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Ling Shao","raw_affiliation_strings":["Inception Institute of Artificial Intelligence, Abu Dhabi, UAE"],"affiliations":[{"raw_affiliation_string":"Inception Institute of Artificial Intelligence, Abu Dhabi, UAE","institution_ids":["https://openalex.org/I4210116052"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100686691","display_name":"Yong Ding","orcid":"https://orcid.org/0000-0002-5226-7511"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Ding","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5108050324"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":4.2622,"has_fulltext":false,"cited_by_count":50,"citation_normalized_percentile":{"value":0.95526405,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"4622","last_page":"4631"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/voxel","display_name":"Voxel","score":0.8729538917541504},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8271936774253845},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.7617031335830688},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7364405989646912},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.6832230091094971},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.663765549659729},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.5420054793357849},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4981374740600586},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4945239722728729},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.442836731672287},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42206865549087524},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.1189461350440979},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10589998960494995}],"concepts":[{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.8729538917541504},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8271936774253845},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.7617031335830688},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7364405989646912},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.6832230091094971},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.663765549659729},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.5420054793357849},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4981374740600586},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4945239722728729},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.442836731672287},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42206865549087524},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.1189461350440979},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10589998960494995},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3474085.3475314","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475314","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.gla.ac.uk:303237","is_oa":true,"landing_page_url":"https://eprints.gla.ac.uk/303237/","pdf_url":null,"source":{"id":"https://openalex.org/S4210235606","display_name":"ENLIGHTEN (Jurnal Bimbingan dan Konseling Islam)","issn_l":"2622-8912","issn":["2622-8912","2622-8920"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":{"id":"pmh:oai:eprints.gla.ac.uk:303237","is_oa":true,"landing_page_url":"https://eprints.gla.ac.uk/303237/","pdf_url":null,"source":{"id":"https://openalex.org/S4210235606","display_name":"ENLIGHTEN (Jurnal Bimbingan dan Konseling Islam)","issn_l":"2622-8912","issn":["2622-8912","2622-8920"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4047288554","display_name":null,"funder_award_id":"2018YFE0183900","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W601228132","https://openalex.org/W639708223","https://openalex.org/W1901129140","https://openalex.org/W2131396337","https://openalex.org/W2150066425","https://openalex.org/W2194775991","https://openalex.org/W2555618208","https://openalex.org/W2560609797","https://openalex.org/W2599765304","https://openalex.org/W2749581528","https://openalex.org/W2768282280","https://openalex.org/W2884561390","https://openalex.org/W2894705404","https://openalex.org/W2897529137","https://openalex.org/W2949708697","https://openalex.org/W2950946295","https://openalex.org/W2951517617","https://openalex.org/W2962807143","https://openalex.org/W2963121255","https://openalex.org/W2963182550","https://openalex.org/W2963400571","https://openalex.org/W2963587345","https://openalex.org/W2963727135","https://openalex.org/W2964062501","https://openalex.org/W2965615303","https://openalex.org/W2968296999","https://openalex.org/W2970828732","https://openalex.org/W2981709511","https://openalex.org/W2981949127","https://openalex.org/W2997814983","https://openalex.org/W3003618643","https://openalex.org/W3008105217","https://openalex.org/W3009445627","https://openalex.org/W3010527308","https://openalex.org/W3034000575","https://openalex.org/W3034314779","https://openalex.org/W3034494113","https://openalex.org/W3034602892","https://openalex.org/W3034681945","https://openalex.org/W3035346742","https://openalex.org/W3035461736","https://openalex.org/W3035748168","https://openalex.org/W3042259089","https://openalex.org/W3087774910","https://openalex.org/W3095522139","https://openalex.org/W3109675406","https://openalex.org/W3113968283","https://openalex.org/W3117804044","https://openalex.org/W3120465108","https://openalex.org/W3120703970","https://openalex.org/W3170984066","https://openalex.org/W3177497967","https://openalex.org/W4210257598","https://openalex.org/W4286696412","https://openalex.org/W4288092002","https://openalex.org/W4301045096"],"related_works":["https://openalex.org/W3027020613","https://openalex.org/W2016533837","https://openalex.org/W3167885074","https://openalex.org/W2892386716","https://openalex.org/W1998563493","https://openalex.org/W4306164210","https://openalex.org/W4313316311","https://openalex.org/W4362608745","https://openalex.org/W2383143032","https://openalex.org/W2082728368"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,39],"present":[4],"an":[5],"Intersection-over-Union":[6],"(IoU)":[7],"guided":[8],"two-stage":[9],"3D":[10,64],"object":[11,84],"detector":[12],"with":[13,76,92,149],"a":[14,41,63,112,128],"voxel-to-point":[15,43],"decoder.":[16],"To":[17],"preserve":[18],"the":[19,28,47,53,57,74,77,83,93,100,106,119,123,153],"necessary":[20],"information":[21,104],"from":[22,56],"all":[23],"raw":[24],"points":[25],"and":[26,72,114,138],"maintain":[27],"high":[29],"box":[30,107],"recall":[31],"in":[32,50,105],"voxel":[33,58],"based":[34,59],"Region":[35,65],"Proposal":[36],"Network":[37],"(RPN),":[38],"propose":[40,111],"residual":[42],"decoder":[44],"to":[45,52,70,117,122],"extract":[46],"point":[48],"features":[49,55,75,88],"addition":[51],"map-view":[54],"RPN.":[60],"We":[61,110],"use":[62],"of":[66],"Interest":[67],"(RoI)":[68],"alignment":[69],"crop":[71],"align":[73,118],"proposal":[78,125],"boxes":[79,126],"for":[80],"accurately":[81],"perceiving":[82],"position.":[85],"The":[86,133,156],"RoI-Aligned":[87],"are":[89],"finally":[90],"aggregated":[91],"corner":[94,103],"geometry":[95],"embeddings":[96],"that":[97,143],"can":[98],"provide":[99],"potentially":[101],"missing":[102],"refinement":[108],"stage.":[109],"simple":[113],"efficient":[115],"method":[116,145],"estimated":[120],"IoUs":[121],"refined":[124],"as":[127],"more":[129],"relevant":[130],"localization":[131],"confidence.":[132],"comprehensive":[134],"experiments":[135],"on":[136,160],"KITTI":[137],"Waymo":[139],"Open":[140],"Dataset":[141],"demonstrate":[142],"our":[144],"achieves":[146],"significant":[147],"improvements":[148],"novel":[150],"architectures":[151],"against":[152],"existing":[154],"methods.":[155],"code":[157],"is":[158],"available":[159],"Github":[161],"URLhttps://github.com/jialeli1/From-Voxel-to-Point":[162],".":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":16},{"year":2022,"cited_by_count":13}],"updated_date":"2026-03-15T09:29:46.208133","created_date":"2025-10-10T00:00:00"}
