{"id":"https://openalex.org/W7138333786","doi":"https://doi.org/10.1609/aaai.v40i8.37539","title":"Point Cloud Quantization Through Multimodal Prompting for 3D Understanding","display_name":"Point Cloud Quantization Through Multimodal Prompting for 3D Understanding","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138333786","doi":"https://doi.org/10.1609/aaai.v40i8.37539"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i8.37539","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i8.37539","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37539/41501","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37539/41501","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129751469","display_name":"Hongxuan Li","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongxuan Li","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129673467","display_name":"Wencheng Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I136765683","display_name":"Tianjin University of Technology","ror":"https://ror.org/00zbe0w13","country_code":"CN","type":"education","lineage":["https://openalex.org/I136765683"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wencheng Zhu","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University\nHaihe Laboratory of Information Technology Application Innovation"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University\nHaihe Laboratory of Information Technology Application Innovation","institution_ids":["https://openalex.org/I136765683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129717847","display_name":"Huiying Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I135237710","display_name":"Zhejiang Normal University","ror":"https://ror.org/01vevwk45","country_code":"CN","type":"education","lineage":["https://openalex.org/I135237710"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huiying Xu","raw_affiliation_strings":["School of Computer Science and Technology, Zhejiang Normal University"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Normal University","institution_ids":["https://openalex.org/I135237710"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129675085","display_name":"Xinzhong Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I135237710","display_name":"Zhejiang Normal University","ror":"https://ror.org/01vevwk45","country_code":"CN","type":"education","lineage":["https://openalex.org/I135237710"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinzhong Zhu","raw_affiliation_strings":["School of Computer Science and Technology, Zhejiang Normal University"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Normal University","institution_ids":["https://openalex.org/I135237710"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129688204","display_name":"Pengfei Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengfei Zhu","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University","institution_ids":["https://openalex.org/I162868743"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5129751469"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70588235,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"8","first_page":"6145","last_page":"6153"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9745000004768372,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9745000004768372,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.0044999998062849045,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.0024999999441206455,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6442000269889832},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5871999859809875},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.4408999979496002},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4293999969959259},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.4251999855041504},{"id":"https://openalex.org/keywords/codebook","display_name":"Codebook","score":0.40610000491142273},{"id":"https://openalex.org/keywords/centroid","display_name":"Centroid","score":0.3910999894142151},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.35690000653266907}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7171000242233276},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6442000269889832},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5871999859809875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5041000247001648},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.4408999979496002},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4293999969959259},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.4251999855041504},{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.40610000491142273},{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3862999975681305},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.35690000653266907},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3370000123977661},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C93372532","wikidata":"https://www.wikidata.org/wiki/Q6552455","display_name":"Linde\u2013Buzo\u2013Gray algorithm","level":3,"score":0.26969999074935913},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2671999931335449},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.26499998569488525},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26489999890327454},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i8.37539","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i8.37539","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37539/41501","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i8.37539","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i8.37539","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37539/41501","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1585402135","display_name":null,"funder_award_id":"62222608","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2802911279","display_name":null,"funder_award_id":"Young","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4020255992","display_name":null,"funder_award_id":"Project","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5532155222","display_name":null,"funder_award_id":"Tianjin","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"},{"id":"https://openalex.org/G5854786607","display_name":null,"funder_award_id":"Tianjin","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7077580569","display_name":null,"funder_award_id":"62436002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323993","display_name":"Natural Science Foundation of Tianjin City","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138333786.pdf","grobid_xml":"https://content.openalex.org/works/W7138333786.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vector":[0],"quantization":[1,63,117,154],"has":[2],"emerged":[3],"as":[4,44,93],"a":[5,59,115],"powerful":[6],"tool":[7],"in":[8,39,50,133],"large-scale":[9],"multimodal":[10,45,61],"models,":[11],"unifying":[12],"heterogeneous":[13],"representations":[14,135],"through":[15,87],"discrete":[16],"token":[17],"encoding.":[18],"However,":[19],"its":[20,48],"effectiveness":[21,168],"hinges":[22],"on":[23,31,158],"robust":[24,94],"codebook":[25],"design.":[26],"Current":[27],"prototype-based":[28],"approaches":[29],"relying":[30],"trainable":[32],"vectors":[33],"or":[34],"clustered":[35],"centroids":[36],"fall":[37],"short":[38],"representativeness":[40],"and":[41,97,122,129,140,161],"interpretability,":[42],"even":[43],"alignment":[46],"demonstrates":[47],"promise":[49],"vision-language":[51,109],"models.":[52],"To":[53],"address":[54],"these":[55,105],"limitations,":[56],"we":[57,144],"propose":[58],"simple":[60],"prompting-driven":[62],"framework":[64,113],"for":[65],"point":[66],"cloud":[67],"analysis.":[68],"Our":[69],"methodology":[70],"is":[71],"built":[72],"upon":[73],"two":[74],"core":[75],"insights:":[76],"1)":[77],"Text":[78],"embeddings":[79],"from":[80],"pre-trained":[81],"models":[82],"inherently":[83],"encode":[84,138],"visual":[85,128],"semantics":[86],"many-to-one":[88],"contrastive":[89],"alignment,":[90],"naturally":[91],"serving":[92],"prototype":[95,130],"priors;":[96],"2)":[98],"Multimodal":[99],"prompts":[100],"enable":[101],"adaptive":[102],"refinement":[103],"of":[104,169],"prototypes,":[106],"effectively":[107],"mitigating":[108],"semantic":[110,141],"gaps.":[111],"The":[112],"introduces":[114],"dual-constrained":[116],"space,":[118],"enforced":[119],"by":[120],"compactness":[121],"separation":[123],"regularization,":[124],"which":[125],"seamlessly":[126],"integrates":[127],"features,":[131],"resulting":[132],"hybrid":[134],"that":[136],"jointly":[137],"geometric":[139],"information.":[142],"Furthermore,":[143],"employ":[145],"Gumbel-Softmax":[146],"relaxation":[147],"to":[148],"achieve":[149],"differentiable":[150],"discretization":[151],"while":[152],"maintaining":[153],"sparsity.":[155],"Extensive":[156],"experiments":[157],"the":[159,166,170],"ModelNet40":[160],"ScanObjectNN":[162],"datasets":[163],"clearly":[164],"demonstrate":[165],"superior":[167],"proposed":[171],"method.":[172]},"counts_by_year":[],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2026-03-18T00:00:00"}
