{"id":"https://openalex.org/W7128688323","doi":"https://doi.org/10.48550/arxiv.2602.11007","title":"LaSSM: Efficient Semantic-Spatial Query Decoding via Local Aggregation and State Space Models for 3D Instance Segmentation","display_name":"LaSSM: Efficient Semantic-Spatial Query Decoding via Local Aggregation and State Space Models for 3D Instance Segmentation","publication_year":2026,"publication_date":"2026-02-11","ids":{"openalex":"https://openalex.org/W7128688323","doi":"https://doi.org/10.48550/arxiv.2602.11007"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.11007","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125741200","display_name":"Lei Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yao, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125730155","display_name":"Yi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125746372","display_name":"Yawen Cui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Yawen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016553220","display_name":"Moyun Liu","orcid":"https://orcid.org/0000-0002-4530-2606"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Moyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125689196","display_name":"Lap-Pui Chau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chau, Lap-Pui","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5125741200"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.8378000259399414,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.8378000259399414,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.06520000100135803,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.01209999993443489,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.6650000214576721},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5200999975204468},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4803999960422516},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.4781999886035919},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.45260000228881836},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.438400000333786},{"id":"https://openalex.org/keywords/online-aggregation","display_name":"Online aggregation","score":0.42320001125335693},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.42170000076293945},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.3962000012397766}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7738999724388123},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.6650000214576721},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5200999975204468},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4803999960422516},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.4781999886035919},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.45260000228881836},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.438400000333786},{"id":"https://openalex.org/C24028149","wikidata":"https://www.wikidata.org/wiki/Q7094056","display_name":"Online aggregation","level":5,"score":0.42320001125335693},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.42170000076293945},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4052000045776367},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3962000012397766},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.39250001311302185},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37940001487731934},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.3684999942779541},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32519999146461487},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.32409998774528503},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3066999912261963},{"id":"https://openalex.org/C13670688","wikidata":"https://www.wikidata.org/wiki/Q3500548","display_name":"Space partitioning","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2776372474","wikidata":"https://www.wikidata.org/wiki/Q508291","display_name":"Simplicity","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25760000944137573},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.25200000405311584}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.11007","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.11007","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.11007","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.11007","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Query-based":[0],"3D":[1],"scene":[2,76,176],"instance":[3,136,177],"segmentation":[4],"from":[5,16,64],"point":[6,27],"clouds":[7,28],"has":[8],"attained":[9],"notable":[10],"performance.":[11,50],"However,":[12],"existing":[13],"methods":[14],"suffer":[15],"the":[17,23,61,105,124,139,153,159,203],"query":[18,37,57,62,125],"initialization":[19],"dilemma":[20],"due":[21],"to":[22,59,107,119],"sparse":[24],"nature":[25],"of":[26,141,205],"and":[29,45,71,78,113,144,188,199,210],"rely":[30],"on":[31,109,152,184],"computationally":[32],"intensive":[33],"attention":[34],"mechanisms":[35],"in":[36,173],"decoders.":[38],"We":[39,81],"accordingly":[40],"introduce":[41],"LaSSM,":[42],"prioritizing":[43],"simplicity":[44],"efficiency":[46],"while":[47],"maintaining":[48],"competitive":[49,182],"Specifically,":[51],"we":[52],"propose":[53],"a":[54,84,99,114],"hierarchical":[55],"semantic-spatial":[56],"initializer":[58],"derive":[60],"set":[63,126],"superpoints":[65],"by":[66,127,163],"considering":[67],"both":[68],"semantic":[69],"cues":[70],"spatial":[72,115],"distribution,":[73],"achieving":[74],"comprehensive":[75],"coverage":[77],"accelerated":[79],"convergence.":[80],"further":[82],"present":[83],"coordinate-guided":[85],"state":[86],"space":[87],"model":[88,106],"(SSM)":[89],"decoder":[90,97],"that":[91,103],"progressively":[92],"refines":[93],"queries.":[94],"The":[95,208],"novel":[96],"features":[98],"local":[100],"aggregation":[101],"scheme":[102],"restricts":[104],"focus":[108],"geometrically":[110],"coherent":[111],"regions":[112],"dual-path":[116],"SSM":[117],"block":[118],"capture":[120],"underlying":[121],"dependencies":[122],"within":[123],"integrating":[128],"associated":[129],"coordinates":[130],"information.":[131],"Our":[132],"design":[133],"enables":[134],"efficient":[135],"prediction,":[137],"avoiding":[138],"incorporation":[140],"noisy":[142],"information":[143],"reducing":[145],"redundant":[146],"computation.":[147],"LaSSM":[148,179],"ranks":[149],"first":[150],"place":[151],"latest":[154],"ScanNet++":[155,189],"V2":[156],"leaderboard,":[157],"outperforming":[158],"previous":[160],"best":[161],"method":[162],"2.5%":[164],"mAP":[165],"with":[166,192],"only":[167],"1/3":[168],"FLOPs,":[169],"demonstrating":[170],"its":[171],"superiority":[172],"challenging":[174],"large-scale":[175],"segmentation.":[178],"also":[180],"achieves":[181],"performance":[183],"ScanNet,":[185],"ScanNet200,":[186],"S3DIS":[187],"V1":[190],"benchmarks":[191],"less":[193],"computational":[194],"cost.":[195],"Extensive":[196],"ablation":[197],"studies":[198],"qualitative":[200],"results":[201],"validate":[202],"effectiveness":[204],"our":[206],"design.":[207],"code":[209],"weights":[211],"are":[212],"available":[213],"at":[214],"https://github.com/RayYoh/LaSSM.":[215]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-13T00:00:00"}
