{"id":"https://openalex.org/W7134925935","doi":"https://doi.org/10.48550/arxiv.2603.09737","title":"$M^2$-Occ: Resilient 3D Semantic Occupancy Prediction for Autonomous Driving with Incomplete Camera Inputs","display_name":"$M^2$-Occ: Resilient 3D Semantic Occupancy Prediction for Autonomous Driving with Incomplete Camera Inputs","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134925935","doi":"https://doi.org/10.48550/arxiv.2603.09737"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09737","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09737","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09737","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078686627","display_name":"kaixin lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lin, Kaixin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128761048","display_name":"Kunyu Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Kunyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128778895","display_name":"Di Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Di","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128791952","display_name":"Yufan Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yufan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128751210","display_name":"Ruiping Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ruiping","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128774703","display_name":"Kailun Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Kailun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5078686627"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.22169999778270721,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.22169999778270721,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.1673000007867813,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.15189999341964722,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5976999998092651},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5254999995231628},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5145999789237976},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4925000071525574},{"id":"https://openalex.org/keywords/semantic-mapping","display_name":"Semantic mapping","score":0.4848000109195709},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4699000120162964},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.4691999852657318},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.4092000126838684},{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.390500009059906}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7817000150680542},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5976999998092651},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5375000238418579},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5254999995231628},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5145999789237976},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4925000071525574},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.4848000109195709},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4699000120162964},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.4691999852657318},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.4092000126838684},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39430001378059387},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.390500009059906},{"id":"https://openalex.org/C160331591","wikidata":"https://www.wikidata.org/wiki/Q7075743","display_name":"Occupancy","level":2,"score":0.3831000030040741},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.37619999051094055},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.37380000948905945},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.36149999499320984},{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.3474000096321106},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33719998598098755},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3346000015735626},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.31779998540878296},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3158000111579895},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.2799000144004822},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27559998631477356},{"id":"https://openalex.org/C57077369","wikidata":"https://www.wikidata.org/wiki/Q7075747","display_name":"Occupancy grid mapping","level":4,"score":0.2687000036239624},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2685999870300293},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.26750001311302185},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.266400009393692},{"id":"https://openalex.org/C101814296","wikidata":"https://www.wikidata.org/wiki/Q5439685","display_name":"Feature model","level":3,"score":0.25679999589920044}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09737","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09737","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09737","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09737","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Semantic":[0],"occupancy":[1,41],"prediction":[2,42],"enables":[3],"dense":[4],"3D":[5],"geometric":[6,55],"and":[7,47,57,110,147],"semantic":[8,40,58,106,122],"understanding":[9],"for":[10,176],"autonomous":[11],"driving.":[12],"However,":[13],"existing":[14],"camera-based":[15],"approaches":[16],"implicitly":[17],"assume":[18],"complete":[19],"surround-view":[20],"observations,":[21],"an":[22],"assumption":[23],"that":[24,103],"rarely":[25],"holds":[26],"in":[27,88],"real-world":[28],"deployment":[29],"due":[30],"to":[31,53,83],"occlusion,":[32],"hardware":[33],"malfunction,":[34],"or":[35],"communication":[36],"failures.":[37],"We":[38,130],"study":[39],"under":[43,178],"incomplete":[44],"multi-camera":[45],"inputs":[46],"introduce":[48,131],"$M^2$-Occ,":[49],"a":[50,70,93,99,132],"framework":[51],"designed":[52],"preserve":[54],"structure":[56],"coherence":[59],"when":[60,125],"views":[61],"are":[62,194],"missing.":[63],"$M^2$-Occ":[64,158],"addresses":[65],"two":[66],"complementary":[67],"challenges.":[68],"First,":[69],"Multi-view":[71],"Masked":[72],"Reconstruction":[73],"(MMR)":[74],"module":[75],"leverages":[76],"the":[77,89,115,138,153,160,165,171,179,188],"spatial":[78],"overlap":[79],"among":[80],"neighboring":[81],"cameras":[82,169],"recover":[84],"missing-view":[85,134],"representations":[86],"directly":[87],"feature":[90],"space.":[91],"Second,":[92],"Feature":[94],"Memory":[95],"Module":[96],"(FMM)":[97],"introduces":[98],"learnable":[100],"memory":[101],"bank":[102],"stores":[104],"class-level":[105],"prototypes.":[107],"By":[108],"retrieving":[109],"integrating":[111],"these":[112],"global":[113],"priors,":[114],"FMM":[116],"refines":[117],"ambiguous":[118],"voxel":[119],"features,":[120],"ensuring":[121],"consistency":[123],"even":[124],"observational":[126],"evidence":[127],"is":[128],"incomplete.":[129],"systematic":[133],"evaluation":[135],"protocol":[136],"on":[137],"nuScenes-based":[139],"SurroundOcc":[140],"benchmark,":[141],"encompassing":[142],"both":[143],"deterministic":[144],"single-view":[145],"failures":[146],"stochastic":[148],"multi-view":[149],"dropout":[150],"scenarios.":[151],"Under":[152],"safety-critical":[154],"missing":[155,168,183],"back-view":[156],"setting,":[157],"improves":[159],"IoU":[161,189],"by":[162,190],"4.93%.":[163],"As":[164],"number":[166],"of":[167],"increases,":[170],"robustness":[172],"gap":[173],"further":[174],"widens;":[175],"instance,":[177],"setting":[180],"with":[181],"five":[182],"views,":[184],"our":[185],"method":[186],"boosts":[187],"5.01%.":[191],"These":[192],"gains":[193],"achieved":[195],"without":[196],"compromising":[197],"full-view":[198],"performance.":[199],"The":[200],"source":[201],"code":[202],"will":[203],"be":[204],"publicly":[205],"released":[206],"at":[207],"https://github.com/qixi7up/M2-Occ.":[208]},"counts_by_year":[],"updated_date":"2026-03-12T06:18:43.230356","created_date":"2026-03-12T00:00:00"}
