{"id":"https://openalex.org/W7135149688","doi":"https://doi.org/10.1109/tits.2026.3668950","title":"Temporal Range-Point-Voxel Fusion for Unified BEV Scene Perception and Motion Prediction","display_name":"Temporal Range-Point-Voxel Fusion for Unified BEV Scene Perception and Motion Prediction","publication_year":2026,"publication_date":"2026-03-11","ids":{"openalex":"https://openalex.org/W7135149688","doi":"https://doi.org/10.1109/tits.2026.3668950"},"language":null,"primary_location":{"id":"doi:10.1109/tits.2026.3668950","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2026.3668950","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128878620","display_name":"Yunlong Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunlong Wang","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128880986","display_name":"Kun Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Jiang","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4995-7244","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052685863","display_name":"Xinyu Jiao","orcid":"https://orcid.org/0000-0002-2462-1691"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyu Jiao","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043682012","display_name":"Jinyu Miao","orcid":"https://orcid.org/0000-0001-8558-9173"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinyu Miao","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128803477","display_name":"Yining Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yining Shi","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2926-925X","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128888949","display_name":"Zheng Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Fu","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5166-1525","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Mengmeng Yang","orcid":"https://orcid.org/0000-0002-3294-6437"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengmeng Yang","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3294-6437","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020028921","display_name":"Tuopu Wen","orcid":"https://orcid.org/0000-0002-3093-765X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tuopu Wen","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3093-765X","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128822272","display_name":"Diange Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Diange Yang","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0074-2448","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27593603,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":"5","first_page":"5072","last_page":"5086"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.4771000146865845,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.4771000146865845,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.20090000331401825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.12890000641345978,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.7235000133514404},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6266999840736389},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5928999781608582},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.569599986076355},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5353999733924866},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5113000273704529},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5037999749183655},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.486299991607666}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7904999852180481},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.7235000133514404},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7125999927520752},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6266999840736389},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5928999781608582},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.569599986076355},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5580000281333923},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5353999733924866},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5113000273704529},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5037999749183655},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.486299991607666},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4092000126838684},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.40450000762939453},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.34549999237060547},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.30000001192092896},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.2791999876499176},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.2639999985694885},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.26159998774528503}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2026.3668950","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2026.3668950","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2826808901","display_name":null,"funder_award_id":"Z221100008122011","funder_id":"https://openalex.org/F4320325902","funder_display_name":"Beijing Municipal Science and Technology Commission"},{"id":"https://openalex.org/G5369562728","display_name":null,"funder_award_id":"52402499","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7213601597","display_name":null,"funder_award_id":"U22A20104","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G951889214","display_name":null,"funder_award_id":"52472449","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320325902","display_name":"Beijing Municipal Science and Technology Commission","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LiDAR-based":[0,49],"bird\u2019s-eye-view":[1],"(BEV)":[2],"perception":[3,51,83],"has":[4],"emerged":[5],"as":[6,108],"an":[7,147],"appealing":[8],"approach":[9],"for":[10,84],"practical":[11],"autonomous":[12],"driving":[13],"applications":[14],"due":[15],"to":[16,31,59],"its":[17],"direct":[18],"leveraging":[19],"of":[20,39,105,194,221,231],"precise":[21],"3D":[22],"structures":[23],"and":[24,36,73,90,110,114,169,172,182],"delivering":[25],"efficient":[26],"performance.":[27,62],"This":[28],"paradigm":[29],"aims":[30],"jointly":[32,111],"determine":[33],"the":[34,152,159,167,224],"semantics":[35],"motion":[37,56,92,115,170,204],"states":[38],"various":[40],"traffic":[41],"participants":[42],"on":[43,55,117,180,213,235],"BEV":[44,50,87,118,195,214],"grids.":[45,119],"However,":[46],"most":[47],"existing":[48],"methods":[52],"primarily":[53],"focus":[54],"prediction,":[57],"leading":[58],"inferior":[60],"semantic":[61,88,113,128,133,140,168,196,215],"To":[63],"address":[64],"this":[65,78],"limitation,":[66],"we":[67,122],"propose":[68],"a":[69,103,125,210,219,228],"novel":[70,126],"multi-frame,":[71],"multi-view,":[72],"multi-task":[74],"unified":[75],"framework":[76],"in":[77,165,192,203],"work,":[79],"which":[80],"enhances":[81],"scene":[82],"both":[85,166],"improved":[86],"segmentation":[89,216],"comparative":[91],"prediction":[93],"performances.":[94],"Our":[95],"framework,":[96],"named":[97],"temporal":[98],"range-point-voxel":[99],"fusion":[100],"(T-RPVFusion),":[101],"leverages":[102],"sequence":[104],"LiDAR":[106,137],"sweeps":[107],"input":[109],"outputs":[112],"information":[116],"In":[120],"T-RPVFusion,":[121],"first":[123],"introduce":[124],"multi-view":[127],"encoder":[129],"that":[130,185],"extracts":[131],"high-quality":[132],"features":[134],"from":[135],"each":[136],"sweep.":[138],"These":[139],"feature":[141,149,161],"maps":[142],"are":[143],"then":[144],"aggregated":[145],"into":[146],"integrated":[148,160],"map":[150,162],"using":[151],"proposed":[153],"bi-layer":[154],"spatio-temporal":[155],"pyramid":[156],"network.":[157],"Subsequently,":[158],"undergoes":[163],"processing":[164],"heads":[171],"yields":[173],"corresponding":[174],"outputs,":[175],"respectively.":[176],"Extensive":[177],"experiments":[178],"conducted":[179],"Waymo":[181,236],"nuScenes":[183],"show":[184],"our":[186,207],"method":[187,208],"outperforms":[188],"previous":[189,225],"state-of-the-art":[190],"(SOTA)":[191],"terms":[193],"segmentation,":[197],"while":[198],"concurrently":[199],"demonstrating":[200],"comparable":[201],"performance":[202],"prediction.":[205],"Notably,":[206],"achieves":[209],"significant":[211],"improvement":[212],"task,":[217],"attaining":[218],"mIOU":[220,234],"49.5%,":[222],"surpassing":[223],"SOTA":[226],"with":[227],"great":[229],"margin":[230],"+":[232],"12.1%":[233],"Open":[237],"Dataset.":[238],"The":[239],"code":[240],"is":[241],"available":[242],"at":[243],"<italic":[244],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[245],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[246],"<uri>https://github.com/thuwyl/trpvfusion</uri>":[247],"</i>":[248]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2026-03-13T00:00:00"}
