{"id":"https://openalex.org/W7138286728","doi":"https://doi.org/10.1609/aaai.v40i15.38238","title":"BEVDilation: LiDAR-Centric Multi-Modal Fusion for 3D Object Detection","display_name":"BEVDilation: LiDAR-Centric Multi-Modal Fusion for 3D Object Detection","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138286728","doi":"https://doi.org/10.1609/aaai.v40i15.38238"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i15.38238","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i15.38238","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38238/42200","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38238/42200","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129700789","display_name":"Guowen Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Guowen Zhang","raw_affiliation_strings":["The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129708126","display_name":"Chenhang He","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Chenhang He","raw_affiliation_strings":["The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129664626","display_name":"Liyi Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Liyi Chen","raw_affiliation_strings":["The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129692205","display_name":"Lei Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5129700789"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":134.2,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.99701715,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"40","issue":"15","first_page":"12448","last_page":"12456"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8661999702453613,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8661999702453613,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.01940000057220459,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.014299999922513962,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.625},{"id":"https://openalex.org/keywords/dilation","display_name":"Dilation (metric space)","score":0.5522000193595886},{"id":"https://openalex.org/keywords/lidar","display_name":"Lidar","score":0.54830002784729},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5138999819755554},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.49390000104904175},{"id":"https://openalex.org/keywords/voxel","display_name":"Voxel","score":0.4611000120639801},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.43290001153945923},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.4131999909877777},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.4016999900341034},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.38749998807907104}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7842000126838684},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7508000135421753},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7143999934196472},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.625},{"id":"https://openalex.org/C2780757906","wikidata":"https://www.wikidata.org/wiki/Q5276676","display_name":"Dilation (metric space)","level":2,"score":0.5522000193595886},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.54830002784729},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5138999819755554},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.49390000104904175},{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.4611000120639801},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.43290001153945923},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.4131999909877777},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.4016999900341034},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.38749998807907104},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3797000050544739},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3790999948978424},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3578000068664551},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.34950000047683716},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3472000062465668},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.3456999957561493},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3411000072956085},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.33379998803138733},{"id":"https://openalex.org/C166704113","wikidata":"https://www.wikidata.org/wiki/Q861092","display_name":"Image registration","level":3,"score":0.32910001277923584},{"id":"https://openalex.org/C203595873","wikidata":"https://www.wikidata.org/wiki/Q25389927","display_name":"Change detection","level":2,"score":0.32589998841285706},{"id":"https://openalex.org/C126422989","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature detection (computer vision)","level":4,"score":0.3222000002861023},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.31859999895095825},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3179999887943268},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i15.38238","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i15.38238","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38238/42200","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i15.38238","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i15.38238","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38238/42200","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.598041832447052,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138286728.pdf","grobid_xml":"https://content.openalex.org/works/W7138286728.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Integrating":[0],"LiDAR":[1,54,136],"and":[2,98,144],"camera":[3],"information":[4,55],"in":[5,16,26,34,56],"the":[6,23,57,75,85,91,96,114,135,149],"bird's":[7],"eye":[8],"view":[9],"(BEV)":[10],"representation":[11],"has":[12],"demonstrated":[13],"its":[14],"effectiveness":[15],"3D":[17],"object":[18],"detection.":[19],"However,":[20],"because":[21],"of":[22,101],"fundamental":[24],"disparity":[25],"geometric":[27],"accuracy":[28],"between":[29],"these":[30],"sensors,":[31],"indiscriminate":[32],"fusion":[33],"previous":[35],"methods":[36,159],"often":[37],"leads":[38],"to":[39,94,133,172,176],"degraded":[40],"performance.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45,105,126],"propose":[46,106],"BEVDilation,":[47],"a":[48,107,128],"novel":[49],"LiDAR-centric":[50,92,167],"framework":[51],"that":[52,112],"prioritizes":[53],"fusion.":[58,178],"By":[59],"formulating":[60],"image":[61,80,86,123,141],"BEV":[62,130],"features":[63],"as":[64],"implicit":[65],"guidance":[66,87,143],"rather":[67],"than":[68,157],"naive":[69,177],"concatenation,":[70],"our":[71,166],"strategy":[72,168],"effectively":[73,89],"alleviates":[74],"spatial":[76],"misalignment":[77],"caused":[78],"by":[79,118],"depth":[81,173],"estimation":[82],"errors.":[83],"Furthermore,":[84],"can":[88],"help":[90],"paradigm":[93],"address":[95],"sparsity":[97,117],"semantic":[99,142],"limitations":[100],"point":[102,116],"clouds.":[103],"Specifically,":[104],"Sparse":[108],"Voxel":[109],"Dilation":[110,131],"Block":[111,132],"mitigates":[113],"inherent":[115],"densifying":[119],"foreground":[120],"voxels":[121],"through":[122],"priors.":[124],"Moreover,":[125],"introduce":[127],"Semantic-Guided":[129],"enhance":[134],"feature":[137],"diffusion":[138],"processing":[139],"with":[140],"long-range":[145],"context":[146],"capture.":[147],"On":[148],"challenging":[150],"nuScenes":[151],"benchmark,":[152],"BEVDilation":[153],"achieves":[154],"better":[155],"performance":[156],"state-of-the-art":[158],"while":[160],"maintaining":[161],"competitive":[162],"computational":[163],"efficiency.":[164],"Importantly,":[165],"demonstrates":[169],"greater":[170],"robustness":[171],"noise":[174],"compared":[175]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-29T08:15:47.926485","created_date":"2026-03-18T00:00:00"}
