{"id":"https://openalex.org/W3115625379","doi":"https://doi.org/10.1145/3426826.3426840","title":"Estimating the Number of Clusters via Proportional Chinese Restaurant Process","display_name":"Estimating the Number of Clusters via Proportional Chinese Restaurant Process","publication_year":2020,"publication_date":"2020-09-18","ids":{"openalex":"https://openalex.org/W3115625379","doi":"https://doi.org/10.1145/3426826.3426840","mag":"3115625379"},"language":"en","primary_location":{"id":"doi:10.1145/3426826.3426840","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3426826.3426840","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 The 3rd International Conference on Machine Learning and Machine Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008721062","display_name":"Yingying Wen","orcid":"https://orcid.org/0000-0001-7469-4066"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingying Wen","raw_affiliation_strings":["Zhejiang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039775525","display_name":"Hangjin Jiang","orcid":"https://orcid.org/0000-0002-3905-7325"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hangjin Jiang","raw_affiliation_strings":["Zhejiang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069353502","display_name":"Jianwei Yin","orcid":"https://orcid.org/0000-0003-4703-7348"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianwei Yin","raw_affiliation_strings":["Zhejiang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18041394,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"70","last_page":"77"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9416999816894531,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9320999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.6875756978988647},{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.6456423997879028},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.605661928653717},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5620931386947632},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.536439061164856},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4577312767505646},{"id":"https://openalex.org/keywords/dirichlet-distribution","display_name":"Dirichlet distribution","score":0.44206932187080383},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.33091193437576294},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0992690920829773},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08592617511749268}],"concepts":[{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.6875756978988647},{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.6456423997879028},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.605661928653717},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5620931386947632},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.536439061164856},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4577312767505646},{"id":"https://openalex.org/C169214877","wikidata":"https://www.wikidata.org/wiki/Q981016","display_name":"Dirichlet distribution","level":3,"score":0.44206932187080383},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33091193437576294},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0992690920829773},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08592617511749268},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C182310444","wikidata":"https://www.wikidata.org/wiki/Q1332643","display_name":"Boundary value problem","level":2,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3426826.3426840","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3426826.3426840","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 The 3rd International Conference on Machine Learning and Machine Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1596294641","https://openalex.org/W1613448136","https://openalex.org/W1864426711","https://openalex.org/W1968729950","https://openalex.org/W1984881674","https://openalex.org/W1997158470","https://openalex.org/W2011342110","https://openalex.org/W2012039831","https://openalex.org/W2053186076","https://openalex.org/W2087309226","https://openalex.org/W2104827998","https://openalex.org/W2147307434","https://openalex.org/W2151388649","https://openalex.org/W2163738067","https://openalex.org/W2168162876","https://openalex.org/W2618735189","https://openalex.org/W2769635192","https://openalex.org/W2785975632","https://openalex.org/W2953322088","https://openalex.org/W4235169531","https://openalex.org/W4299512641"],"related_works":["https://openalex.org/W2950577598","https://openalex.org/W1558456818","https://openalex.org/W2017683341","https://openalex.org/W2020478166","https://openalex.org/W2330172022","https://openalex.org/W2061370939","https://openalex.org/W1653282108","https://openalex.org/W4287323310","https://openalex.org/W2063323033","https://openalex.org/W4313644249"],"abstract_inverted_index":{"Dirichlet":[0],"Process":[1,56,89],"Mixture":[2],"(DPM)":[3],"models":[4,117],"tend":[5],"to":[6,60],"produce":[7],"some":[8],"major":[9,24],"clusters":[10,19,41,123],"along":[11],"with":[12,23,113],"many":[13],"small":[14,17,39,64,103],"clusters.":[15,25,65,104],"These":[16],"confusing":[18],"are":[20],"highly":[21],"overlapped":[22],"As":[26],"the":[27,33,38,49,62,69,93,99,107,120],"size":[28],"of":[29,35,75,95,101,122],"samples":[30],"increasing":[31],"without":[32],"change":[34],"sample":[36],"distribution,":[37],"unnecessary":[40,102],"would":[42],"be":[43],"introduced":[44],"more":[45,47],"and":[46,71,115,118],"in":[48],"cluster":[50],"results.":[51],"Recently,":[52],"powered":[53],"Chinese":[54,87],"Restaurant":[55,88],"(pCRP)":[57],"is":[58],"purposed":[59],"eliminate":[61],"counterfactual":[63],"However,":[66],"it":[67],"violates":[68],"usual":[70],"indispensable":[72],"exchangeability":[73,96],"assumption":[74],"DPM.":[76],"In":[77],"this":[78],"paper,":[79],"we":[80],"propose":[81],"a":[82],"new":[83],"method":[84],"called":[85],"proportional":[86],"(pro-CRP)":[90],"that":[91],"keeps":[92],"property":[94],"while":[97],"reduces":[98],"number":[100,121],"We":[105],"show":[106],"experiment":[108],"results":[109],"on":[110],"comparing":[111],"pro-CRP":[112],"CRP":[114],"pCRP":[116],"prove":[119],"reduced":[124],"by":[125],"pro-CRP.":[126]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
