{"id":"https://openalex.org/W4414196747","doi":"https://doi.org/10.1109/tip.2025.3607643","title":"Cost-Efficient Open Vocabulary 3D Scene Understanding Based on Semantic Probability","display_name":"Cost-Efficient Open Vocabulary 3D Scene Understanding Based on Semantic Probability","publication_year":2025,"publication_date":"2025-09-15","ids":{"openalex":"https://openalex.org/W4414196747","doi":"https://doi.org/10.1109/tip.2025.3607643","pmid":"https://pubmed.ncbi.nlm.nih.gov/40953420"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2025.3607643","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3607643","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101317957","display_name":"Lingfeng Shen","orcid":"https://orcid.org/0009-0001-2730-2485"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lingfeng Shen","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, School of Mechanical Engineering, and Zhejiang Key Laboratory of Advanced Equipment Manufacturing and Measurement Technology, Zhejiang University, Hangzhou, China","School of Mechanical Engineering, State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, School of Mechanical Engineering, and Zhejiang Key Laboratory of Advanced Equipment Manufacturing and Measurement Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"School of Mechanical Engineering, State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024853947","display_name":"Xiaoyao Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyao Wei","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, School of Mechanical Engineering, and Zhejiang Key Laboratory of Advanced Equipment Manufacturing and Measurement Technology, Zhejiang University, Hangzhou, China","School of Mechanical Engineering, State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, School of Mechanical Engineering, and Zhejiang Key Laboratory of Advanced Equipment Manufacturing and Measurement Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"School of Mechanical Engineering, State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084291326","display_name":"Gang Pan","orcid":"https://orcid.org/0000-0002-4049-6181"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Pan","raw_affiliation_strings":["College of Computer Science and Technology and the State Key Laboratory of Brain-Machine Intelligence, Zhejiang University, Hangzhou, Zhejiang, China","College of Computer Science and Technology, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology and the State Key Laboratory of Brain-Machine Intelligence, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I4210123185","https://openalex.org/I55712492"]},{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068607581","display_name":"Qian Zheng","orcid":"https://orcid.org/0000-0003-3968-3622"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]},{"id":"https://openalex.org/I55712492","display_name":"Zhejiang University of Technology","ror":"https://ror.org/02djqfd08","country_code":"CN","type":"education","lineage":["https://openalex.org/I55712492"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qian Zheng","raw_affiliation_strings":["College of Computer Science and Technology and the State Key Laboratory of Brain-Machine Intelligence, Zhejiang University, Hangzhou, Zhejiang, China","College of Computer Science and Technology, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology and the State Key Laboratory of Brain-Machine Intelligence, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I4210123185","https://openalex.org/I55712492"]},{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031390008","display_name":"Yanlong Cao","orcid":"https://orcid.org/0000-0003-0383-6586"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanlong Cao","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, School of Mechanical Engineering, and Zhejiang Key Laboratory of Advanced Equipment Manufacturing and Measurement Technology, Zhejiang University, Hangzhou, China","School of Mechanical Engineering, State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, School of Mechanical Engineering, and Zhejiang Key Laboratory of Advanced Equipment Manufacturing and Measurement Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]},{"raw_affiliation_string":"School of Mechanical Engineering, State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101317957"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.25551933,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"35","issue":null,"first_page":"1832","last_page":"1845"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6654000282287598},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6266999840736389},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6236000061035156},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5511000156402588},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5421000123023987},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4828999936580658},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.4650999903678894},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4221000075340271}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8036999702453613},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7099999785423279},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6654000282287598},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6266999840736389},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6236000061035156},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5511000156402588},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5421000123023987},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5113000273704529},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4828999936580658},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.4650999903678894},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4221000075340271},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4025000035762787},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4000000059604645},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3968999981880188},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.3716999888420105},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.36910000443458557},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35839998722076416},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3481999933719635},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.3199000060558319},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3093000054359436},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29670000076293945},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C202708506","wikidata":"https://www.wikidata.org/wiki/Q7449050","display_name":"Semantic compression","level":5,"score":0.262800008058548},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.2515999972820282}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2025.3607643","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3607643","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:40953420","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40953420","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1920022804","https://openalex.org/W2116588463","https://openalex.org/W2523049145","https://openalex.org/W2594519801","https://openalex.org/W2795014656","https://openalex.org/W2963125977","https://openalex.org/W2963182550","https://openalex.org/W2963530975","https://openalex.org/W2964339842","https://openalex.org/W2968296999","https://openalex.org/W3035574168","https://openalex.org/W3107521863","https://openalex.org/W3109154950","https://openalex.org/W3110503160","https://openalex.org/W3166470370","https://openalex.org/W3167095230","https://openalex.org/W3175450634","https://openalex.org/W3195577467","https://openalex.org/W4205189682","https://openalex.org/W4221154700","https://openalex.org/W4226058394","https://openalex.org/W4226389400","https://openalex.org/W4312274934","https://openalex.org/W4312458986","https://openalex.org/W4312649925","https://openalex.org/W4312912313","https://openalex.org/W4312935996","https://openalex.org/W4312960937","https://openalex.org/W4312980231","https://openalex.org/W4378781606","https://openalex.org/W4383108296","https://openalex.org/W4383108895","https://openalex.org/W4383109105","https://openalex.org/W4386065512","https://openalex.org/W4386065742","https://openalex.org/W4386065874","https://openalex.org/W4386066076","https://openalex.org/W4386075561","https://openalex.org/W4386075580","https://openalex.org/W4386076397","https://openalex.org/W4390190234","https://openalex.org/W4390872744","https://openalex.org/W4391547487","https://openalex.org/W4402704512","https://openalex.org/W4407900973"],"related_works":[],"abstract_inverted_index":{"Traditional":[0],"3D":[1,8,51,110,133,141,158,165,173],"scene":[2,52,174],"understanding":[3,53],"methods":[4],"heavily":[5],"depend":[6],"on":[7,60,104,136,144,193],"annotation":[9],"and":[10,69,106,167,201],"training,":[11],"which":[12],"allow":[13],"for":[14,164],"the":[15,31,40,81,85,89,93,124,128,154,168,172,180,187],"identification":[16],"of":[17,36,42,100,131,157,171],"seen":[18],"classes":[19],"but":[20],"struggle":[21],"to":[22,122,178],"recognize":[23],"unseen":[24],"classes.":[25],"In":[26,152],"this":[27],"paper,":[28],"we":[29,55,79,113,139],"leverage":[30],"open":[32,43,49,145],"vocabulary":[33,44,50],"inference":[34],"capabilities":[35],"pre-trained":[37,76,95],"models,":[38,96],"enabling":[39],"encoding":[41],"concepts.":[45],"However,":[46],"unlike":[47],"existing":[48],"methods,":[54],"propose":[56],"a":[57,115],"framework":[58],"based":[59,103],"semantic":[61,98,119,129,142,155],"probability.":[62],"This":[63],"innovation":[64],"significantly":[65],"reduces":[66],"computational":[67],"cost":[68],"is":[70],"compatible":[71],"with":[72,88],"state-of-the-art":[73],"two-stage":[74],"2D":[75,94],"models.":[77],"Specifically,":[78],"align":[80],"text":[82],"features":[83,91,170],"from":[84,92],"CLIP":[86],"model":[87],"pixel":[90],"inferring":[97],"probability":[99,130,137,156],"image":[101],"pixels":[102],"similarity":[105],"projecting":[107],"it":[108],"onto":[109],"points.":[111,134],"Subsequently,":[112],"introduce":[114],"point":[116,125],"cloud":[117],"pairs":[118],"fusion":[120],"method":[121,189],"merge":[123],"clouds,":[126],"reducing":[127],"erroneous":[132],"Based":[135],"scores,":[138],"achieve":[140],"segmentation":[143,181],"vocabularies":[146],"without":[147],"any":[148],"supervision":[149],"or":[150],"training.":[151],"addition,":[153],"points":[159],"can":[160,175],"serve":[161],"as":[162],"pseudo-labels":[163],"distillation,":[166],"geometric":[169],"be":[176],"exploited":[177],"improve":[179],"performance.":[182],"Experimental":[183],"results":[184],"demonstrate":[185],"that":[186],"proposed":[188],"exhibits":[190],"competitive":[191],"performance":[192],"publicly":[194],"available":[195],"benchmark":[196],"datasets,":[197],"including":[198],"ScanNet,":[199],"Matterport3D,":[200],"nuScenes.":[202]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
