{"id":"https://openalex.org/W4410028551","doi":"https://doi.org/10.1109/tpami.2025.3566593","title":"General 3D Vision-Language Model With Fast Rendering and Pre-Training Vision-Language Alignment","display_name":"General 3D Vision-Language Model With Fast Rendering and Pre-Training Vision-Language Alignment","publication_year":2025,"publication_date":"2025-05-02","ids":{"openalex":"https://openalex.org/W4410028551","doi":"https://doi.org/10.1109/tpami.2025.3566593","pmid":"https://pubmed.ncbi.nlm.nih.gov/40315072"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3566593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3566593","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073973915","display_name":"Kangcheng Liu","orcid":"https://orcid.org/0000-0002-8387-3565"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kangcheng Liu","raw_affiliation_strings":["Division of Engineering and Applied Science, California Institute of Technology (Caltech), Pasadena, CA, USA","Division of Engineering and Applied Science, California Institute of Technology (Caltech), Pasadena, USA"],"affiliations":[{"raw_affiliation_string":"Division of Engineering and Applied Science, California Institute of Technology (Caltech), Pasadena, CA, USA","institution_ids":["https://openalex.org/I122411786"]},{"raw_affiliation_string":"Division of Engineering and Applied Science, California Institute of Technology (Caltech), Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008076279","display_name":"Yong\u2010Jin Liu","orcid":"https://orcid.org/0000-0001-5774-1916"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong-Jin Liu","raw_affiliation_strings":["BNRist, MOE-Key Laboratory of Pervasive Computing, Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"BNRist, MOE-Key Laboratory of Pervasive Computing, Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":null,"display_name":"Baoquan Chen","orcid":"https://orcid.org/0000-0003-4702-036X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baoquan Chen","raw_affiliation_strings":["National Key Lab of Genaral AI, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Key Lab of Genaral AI, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5073973915"],"corresponding_institution_ids":["https://openalex.org/I122411786"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07339962,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"47","issue":"9","first_page":"7352","last_page":"7368"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9688000082969666,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7633056640625},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7318314909934998},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6683226227760315},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.5071330070495605},{"id":"https://openalex.org/keywords/machine-vision","display_name":"Machine vision","score":0.46552297472953796},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3392651677131653}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7633056640625},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7318314909934998},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6683226227760315},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.5071330070495605},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.46552297472953796},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3392651677131653}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3566593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3566593","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:40315072","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40315072","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4456321350","display_name":null,"funder_award_id":"62461160309","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7896783442","display_name":null,"funder_award_id":"62403400","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":113,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1923184257","https://openalex.org/W2002827932","https://openalex.org/W2109067131","https://openalex.org/W2115579991","https://openalex.org/W2149616971","https://openalex.org/W2152864241","https://openalex.org/W2167667767","https://openalex.org/W2412782625","https://openalex.org/W2460657278","https://openalex.org/W2594519801","https://openalex.org/W2799162093","https://openalex.org/W2904332125","https://openalex.org/W2949708697","https://openalex.org/W2955873422","https://openalex.org/W2963125977","https://openalex.org/W2963182550","https://openalex.org/W2968557240","https://openalex.org/W2981983525","https://openalex.org/W2985088149","https://openalex.org/W2988715931","https://openalex.org/W2991216808","https://openalex.org/W3008105217","https://openalex.org/W3009201938","https://openalex.org/W3012494314","https://openalex.org/W3014902535","https://openalex.org/W3034239841","https://openalex.org/W3034266912","https://openalex.org/W3034314779","https://openalex.org/W3034949383","https://openalex.org/W3035057392","https://openalex.org/W3035272603","https://openalex.org/W3035426492","https://openalex.org/W3035574168","https://openalex.org/W3035739565","https://openalex.org/W3036560856","https://openalex.org/W3109944402","https://openalex.org/W3110047846","https://openalex.org/W3110503160","https://openalex.org/W3116730076","https://openalex.org/W3116959466","https://openalex.org/W3152786524","https://openalex.org/W3166573884","https://openalex.org/W3167071962","https://openalex.org/W3167095230","https://openalex.org/W3167684723","https://openalex.org/W3167855660","https://openalex.org/W3169120894","https://openalex.org/W3171215128","https://openalex.org/W3177276051","https://openalex.org/W3177280664","https://openalex.org/W3178218920","https://openalex.org/W3179630053","https://openalex.org/W3181190968","https://openalex.org/W3186678659","https://openalex.org/W3202349074","https://openalex.org/W3202611145","https://openalex.org/W3202623927","https://openalex.org/W3205364888","https://openalex.org/W3217135629","https://openalex.org/W4205189682","https://openalex.org/W4206398307","https://openalex.org/W4221145169","https://openalex.org/W4285102311","https://openalex.org/W4288751081","https://openalex.org/W4302276600","https://openalex.org/W4310078553","https://openalex.org/W4312699854","https://openalex.org/W4312812384","https://openalex.org/W4312818263","https://openalex.org/W4312960937","https://openalex.org/W4313056955","https://openalex.org/W4313213824","https://openalex.org/W4313400313","https://openalex.org/W4321194933","https://openalex.org/W4382240808","https://openalex.org/W4385431115","https://openalex.org/W4386065568","https://openalex.org/W4386065804","https://openalex.org/W4386066076","https://openalex.org/W4386071681","https://openalex.org/W4386071966","https://openalex.org/W4386072165","https://openalex.org/W4386075694","https://openalex.org/W4386076066","https://openalex.org/W4386076097","https://openalex.org/W4386083124","https://openalex.org/W4390872695","https://openalex.org/W4390873936","https://openalex.org/W4390874324","https://openalex.org/W4390874386","https://openalex.org/W4390874575","https://openalex.org/W4393074218","https://openalex.org/W4395455125","https://openalex.org/W4399410938","https://openalex.org/W4402667898","https://openalex.org/W4402716083","https://openalex.org/W4410536678","https://openalex.org/W6631190155","https://openalex.org/W6764136514","https://openalex.org/W6765299845","https://openalex.org/W6776539250","https://openalex.org/W6786169801","https://openalex.org/W6789930856","https://openalex.org/W6791353385","https://openalex.org/W6793963566","https://openalex.org/W6810334672","https://openalex.org/W6838957033","https://openalex.org/W6846033935","https://openalex.org/W6846133297","https://openalex.org/W6846835116","https://openalex.org/W6849571719","https://openalex.org/W6851607685"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Current":[0],"prevailing":[1],"vision-language":[2,161,181],"models":[3,39],"have":[4,42],"achieved":[5],"remarkable":[6],"progress":[7],"in":[8,14,55,94,102,122,310],"3D":[9,29,74,115,142],"scene":[10,30,75,143,188],"understanding":[11,76,144,189],"while":[12],"trained":[13],"the":[15,26,43,52,70,123,126,146,159,186,193,207,222,236,241,249,261,267,285,305],"closed-set":[16],"setting":[17],"and":[18,119,136,169,175,216,272,290,294,301,314],"with":[19,141,202,298],"full":[20],"labels.":[21],"The":[22],"major":[23],"bottleneck":[24],"for":[25,33,139,155,229],"current":[27,72],"robot":[28,58,62,67],"recognition":[31],"approach":[32,309],"robotic":[34],"applications":[35,59],"is":[36],"that":[37,108],"these":[38],"do":[40],"not":[41],"capacity":[44],"to":[45,86,113,173,217,239],"recognize":[46],"any":[47],"unseen":[48],"novel":[49,156,199],"classes":[50],"beyond":[51],"training":[53],"categories":[54,157],"diverse":[56],"real-world":[57],"such":[60],"as":[61,64,66],"manipulation":[63],"well":[65,93],"navigation.":[68],"In":[69,248],"meantime,":[71],"state-of-the-art":[73,280],"approaches":[77],"primarily":[78],"require":[79],"a":[80,95,106,134,165,198],"large":[81],"number":[82],"of":[83,105,235,269,307],"high-quality":[84],"labels":[85,127],"train":[87],"neural":[88,237],"networks,":[89],"which":[90,183],"merely":[91],"perform":[92],"fully":[96],"supervised":[97],"manner.":[98],"Therefore,":[99],"we":[100,163,196,220],"are":[101,128,149],"urgent":[103],"need":[104],"framework":[107,138],"can":[109],"simultaneously":[110],"be":[111],"applicable":[112],"both":[114,266,299,311],"point":[116,230],"cloud":[117],"segmentation":[118,271],"detection,":[120],"particularly":[121],"circumstances":[124],"where":[125],"rather":[129],"scarce.":[130],"This":[131],"work":[132],"presents":[133],"generalized":[135],"straightforward":[137],"dealing":[140],"when":[145],"labeled":[147],"scenes":[148,303],"quite":[150],"limited.":[151],"To":[152,191,211],"extract":[153,174],"knowledge":[154,170],"from":[158,179,206],"pre-trained":[160],"models,":[162,182],"propose":[164,197,221],"hierarchical":[166],"feature-aligned":[167],"pre-training":[168],"distillation":[171],"strategy":[172],"distill":[176],"meaningful":[177],"information":[178],"large-scale":[180,262,287],"helps":[184],"benefit":[185],"open-vocabulary":[187],"tasks.":[190],"leverage":[192],"boundary":[194,203,209],"information,":[195],"energy-based":[200],"loss":[201],"awareness":[204],"benefiting":[205],"region-level":[208,224],"predictions.":[210],"encourage":[212],"latent":[213],"instance":[214,273],"discrimination":[215],"guarantee":[218],"efficiency,":[219],"unsupervised":[223],"semantic":[225,270],"contrastive":[226],"learning":[227,282,313],"scheme":[228],"clouds,":[231],"using":[232],"confident":[233],"predictions":[234],"network":[238],"discriminate":[240],"intermediate":[242],"feature":[243],"embeddings":[244],"at":[245],"multiple":[246],"stages.":[247],"limited":[250],"reconstruction":[251],"case,":[252],"our":[253,276,308],"proposed":[254,277],"approach,":[255],"termed":[256],"WS3D++,":[257],"ranks":[258],"1st":[259],"on":[260,265,284],"ScanNet":[263],"benchmark":[264],"task":[268],"segmentation.":[274],"Also,":[275],"WS3D++":[278],"achieves":[279],"data-efficient":[281,312],"performance":[283],"other":[286],"real-scene":[288],"indoor":[289,300],"outdoor":[291,302],"datasets":[292],"S3DIS":[293],"SemanticKITTI.":[295],"Extensive":[296],"experiments":[297],"demonstrated":[304],"effectiveness":[306],"open-world":[315],"few-shot":[316],"learning.":[317]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
