{"id":"https://openalex.org/W7128440741","doi":"https://doi.org/10.1109/tip.2026.3660576","title":"Multi-Resolution Alignment for Voxel Sparsity in Camera-Based 3D Semantic Scene Completion","display_name":"Multi-Resolution Alignment for Voxel Sparsity in Camera-Based 3D Semantic Scene Completion","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7128440741","doi":"https://doi.org/10.1109/tip.2026.3660576","pmid":"https://pubmed.ncbi.nlm.nih.gov/41662539"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2026.3660576","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2026.3660576","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101936895","display_name":"Zhiwen Yang","orcid":"https://orcid.org/0000-0002-0416-0576"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwen Yang","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0416-0576","affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yuxin Peng","orcid":"https://orcid.org/0000-0001-7658-3845"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuxin Peng","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7658-3845","affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14953471,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"35","issue":null,"first_page":"1771","last_page":"1785"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.36309999227523804,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.36309999227523804,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.2922999858856201,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.18070000410079956,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/voxel","display_name":"Voxel","score":0.9020000100135803},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.598800003528595},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4918000102043152},{"id":"https://openalex.org/keywords/semantic-mapping","display_name":"Semantic mapping","score":0.4620000123977661},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4555000066757202},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4375999867916107},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.43650001287460327},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.39169999957084656}],"concepts":[{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.9020000100135803},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7893000245094299},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7505999803543091},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.598800003528595},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5503000020980835},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4918000102043152},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.4620000123977661},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4555000066757202},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4375999867916107},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.43650001287460327},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.39169999957084656},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.36489999294281006},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.32019999623298645},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.31630000472068787},{"id":"https://openalex.org/C31487907","wikidata":"https://www.wikidata.org/wiki/Q1154597","display_name":"Polygon mesh","level":2,"score":0.2777999937534332},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.25380000472068787}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2026.3660576","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2026.3660576","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:41662539","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41662539","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.7142164707183838,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1709766391","display_name":null,"funder_award_id":"L257005","funder_id":"https://openalex.org/F4320334977","funder_display_name":"Beijing Municipal Natural Science Foundation"},{"id":"https://openalex.org/G3506972120","display_name":null,"funder_award_id":"L247006","funder_id":"https://openalex.org/F4320334977","funder_display_name":"Beijing Municipal Natural Science Foundation"},{"id":"https://openalex.org/G3509253272","display_name":null,"funder_award_id":"62432001","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6078352744","display_name":null,"funder_award_id":"62132001","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8190739672","display_name":null,"funder_award_id":"62525201","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334977","display_name":"Beijing Municipal Natural Science Foundation","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2150066425","https://openalex.org/W2194775991","https://openalex.org/W2412782625","https://openalex.org/W2557465155","https://openalex.org/W2565639579","https://openalex.org/W2795587607","https://openalex.org/W2963766190","https://openalex.org/W2985561844","https://openalex.org/W2991216808","https://openalex.org/W3035524453","https://openalex.org/W3109395584","https://openalex.org/W3109428934","https://openalex.org/W3126856052","https://openalex.org/W3174692508","https://openalex.org/W3179909833","https://openalex.org/W3195680177","https://openalex.org/W3201467792","https://openalex.org/W3215584334","https://openalex.org/W4200308510","https://openalex.org/W4214530037","https://openalex.org/W4312894406","https://openalex.org/W4378781606","https://openalex.org/W4382450829","https://openalex.org/W4382464460","https://openalex.org/W4383108371","https://openalex.org/W4386066358","https://openalex.org/W4386075718","https://openalex.org/W4386083035","https://openalex.org/W4389666133","https://openalex.org/W4390872682","https://openalex.org/W4390873564","https://openalex.org/W4390874310","https://openalex.org/W4393153987","https://openalex.org/W4402703001","https://openalex.org/W4402753672","https://openalex.org/W4402753845","https://openalex.org/W4402754012","https://openalex.org/W4402891997"],"related_works":[],"abstract_inverted_index":{"Camera-based":[0],"3D":[1,24,104,118,139],"semantic":[2,16,105,165,173,207],"scene":[3,25,32,106,111,146],"completion":[4],"(SSC)":[5],"offers":[6],"a":[7,30,68,93,176,184,190,211],"cost-effective":[8],"solution":[9],"for":[10,35,171,214],"assessing":[11],"the":[12,22,36,55,62,110,127,145,156,163,172,203,218,229,249],"geometric":[13],"occupancy":[14],"and":[15,60,84,112,141,209,231],"labels":[17,59],"of":[18,64,71,167,175,205,251],"each":[19,168],"voxel":[20,58,65,100,178,253],"in":[21,47,73,102,247],"surrounding":[23],"with":[26,202],"image":[27,135],"inputs,":[28],"providing":[29],"voxel-level":[31],"perception":[33],"foundation":[34],"perception-prediction-planning":[37],"autonomous":[38,74],"driving":[39,75],"systems.":[40],"Although":[41],"significant":[42],"progress":[43],"has":[44],"been":[45],"made":[46],"existing":[48,241],"methods,":[49,243],"their":[50],"optimization":[51,82],"rely":[52],"solely":[53],"on":[54,217,228],"supervision":[56,216],"from":[57],"face":[61],"challenge":[63],"sparsity":[66,101],"as":[67,120,199],"large":[69],"portion":[70],"voxels":[72,182,198],"scenarios":[76],"are":[77],"empty,":[78],"which":[79,108,132,195],"limits":[80],"both":[81],"efficiency":[83],"model":[85],"performance.":[86],"To":[87],"address":[88],"this":[89],"issue,":[90],"we":[91,124,154,188],"propose":[92,126],"Multi-Resolution":[94],"Alignment":[95,193],"(MRA)":[96],"approach":[97,238],"to":[98,161],"mitigate":[99],"camera-based":[103],"completion,":[107],"exploits":[109],"instance":[113],"level":[114,147],"alignment":[115],"across":[116,223],"multi-resolution":[117,138],"features":[119,136,140],"auxiliary":[121,215],"supervision.":[122],"Specifically,":[123],"first":[125],"Multi-resolution":[128],"View":[129],"Transformer":[130],"module,":[131,194],"projects":[133],"2D":[134],"into":[137],"aligns":[142],"them":[143],"at":[144,259],"through":[148],"fusing":[149],"discriminative":[150],"seed":[151],"features.":[152],"Furthermore,":[153],"design":[155],"Cubic":[157],"Semantic":[158],"Anisotropy":[159],"module":[160],"identify":[162],"instance-level":[164,200],"significance":[166],"voxel,":[169],"accounting":[170],"differences":[174],"specific":[177],"against":[179],"its":[180,245],"neighboring":[181],"within":[183],"cubic":[185,206],"area.":[186],"Finally,":[187],"devise":[189],"Critical":[191],"Distribution":[192],"selects":[196],"critical":[197,219],"anchors":[201],"guidance":[204],"anisotropy,":[208],"applies":[210],"circulated":[212],"loss":[213],"feature":[220],"distribution":[221],"consistency":[222],"different":[224],"resolutions.":[225],"Extensive":[226],"experiments":[227],"SemanticKITTI":[230],"SSCBench-KITTI-360":[232],"datasets":[233],"demonstrate":[234],"that":[235],"our":[236],"MRA":[237],"significantly":[239],"outperforms":[240],"state-of-the-art":[242],"showcasing":[244],"effectiveness":[246],"mitigating":[248],"impact":[250],"sparse":[252],"labels.":[254],"The":[255],"code":[256],"is":[257],"available":[258],"https://github.com/PKU-ICST-MIPL/MRA_TIP.":[260]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2026-02-07T00:00:00"}
