{"id":"https://openalex.org/W4400246824","doi":"https://doi.org/10.1007/s00357-024-09480-4","title":"A New Look at the Dirichlet Distribution: Robustness, Clustering, and Both Together","display_name":"A New Look at the Dirichlet Distribution: Robustness, Clustering, and Both Together","publication_year":2024,"publication_date":"2024-07-02","ids":{"openalex":"https://openalex.org/W4400246824","doi":"https://doi.org/10.1007/s00357-024-09480-4"},"language":"en","primary_location":{"id":"doi:10.1007/s00357-024-09480-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00357-024-09480-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00357-024-09480-4.pdf","source":{"id":"https://openalex.org/S73028643","display_name":"Journal of Classification","issn_l":"0176-4268","issn":["0176-4268","1432-1343"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Classification","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00357-024-09480-4.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015878679","display_name":"Salvatore D. Tomarchio","orcid":"https://orcid.org/0000-0003-2690-8546"},"institutions":[{"id":"https://openalex.org/I39063666","display_name":"University of Catania","ror":"https://ror.org/03a64bh57","country_code":"IT","type":"education","lineage":["https://openalex.org/I39063666"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Salvatore D. Tomarchio","raw_affiliation_strings":["Department of Economics and Business, University of Catania, Catania, Italy"],"raw_orcid":"https://orcid.org/0000-0003-2690-8546","affiliations":[{"raw_affiliation_string":"Department of Economics and Business, University of Catania, Catania, Italy","institution_ids":["https://openalex.org/I39063666"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009939605","display_name":"Antonio Punzo","orcid":"https://orcid.org/0000-0001-7742-1821"},"institutions":[{"id":"https://openalex.org/I39063666","display_name":"University of Catania","ror":"https://ror.org/03a64bh57","country_code":"IT","type":"education","lineage":["https://openalex.org/I39063666"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Antonio Punzo","raw_affiliation_strings":["Department of Economics and Business, University of Catania, Catania, Italy"],"raw_orcid":"https://orcid.org/0000-0001-7742-1821","affiliations":[{"raw_affiliation_string":"Department of Economics and Business, University of Catania, Catania, Italy","institution_ids":["https://openalex.org/I39063666"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063817631","display_name":"Johan Ferreira","orcid":"https://orcid.org/0000-0002-5945-6550"},"institutions":[{"id":"https://openalex.org/I69552723","display_name":"University of Pretoria","ror":"https://ror.org/00g0p6g84","country_code":"ZA","type":"education","lineage":["https://openalex.org/I69552723"]}],"countries":["ZA"],"is_corresponding":false,"raw_author_name":"Johannes T. Ferreira","raw_affiliation_strings":["Department of Statistics, University of Pretoria, Pretoria, South Africa"],"raw_orcid":"https://orcid.org/0000-0002-5945-6550","affiliations":[{"raw_affiliation_string":"Department of Statistics, University of Pretoria, Pretoria, South Africa","institution_ids":["https://openalex.org/I69552723"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024962335","display_name":"Andri\u00ebtte Bekker","orcid":"https://orcid.org/0000-0003-4793-5674"},"institutions":[{"id":"https://openalex.org/I4210161783","display_name":"GeoInformation (United Kingdom)","ror":"https://ror.org/05t4zqc79","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210161783"]},{"id":"https://openalex.org/I69552723","display_name":"University of Pretoria","ror":"https://ror.org/00g0p6g84","country_code":"ZA","type":"education","lineage":["https://openalex.org/I69552723"]}],"countries":["GB","ZA"],"is_corresponding":false,"raw_author_name":"Andriette Bekker","raw_affiliation_strings":["Department of Geography, Geoinformatics and Meteorology, Centre for Environmental Studies, Pretoria, South Africa","Department of Statistics, University of Pretoria, Pretoria, South Africa"],"raw_orcid":"https://orcid.org/0000-0003-4793-5674","affiliations":[{"raw_affiliation_string":"Department of Geography, Geoinformatics and Meteorology, Centre for Environmental Studies, Pretoria, South Africa","institution_ids":["https://openalex.org/I4210161783"]},{"raw_affiliation_string":"Department of Statistics, University of Pretoria, Pretoria, South Africa","institution_ids":["https://openalex.org/I69552723"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5015878679"],"corresponding_institution_ids":["https://openalex.org/I39063666"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":3.9736,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.94316952,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"42","issue":"1","first_page":"31","last_page":"53"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9609000086784363,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10968","display_name":"Statistical Distribution Estimation and Applications","score":0.9552000164985657,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6778256297111511},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6311905384063721},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.5453935265541077},{"id":"https://openalex.org/keywords/dirichlet-distribution","display_name":"Dirichlet distribution","score":0.5217182040214539},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48450562357902527},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48077934980392456},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.47188273072242737},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.37716376781463623},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3666112422943115},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.17511719465255737},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.1058671772480011},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.07385805249214172},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.07016444206237793}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6778256297111511},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6311905384063721},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5453935265541077},{"id":"https://openalex.org/C169214877","wikidata":"https://www.wikidata.org/wiki/Q981016","display_name":"Dirichlet distribution","level":3,"score":0.5217182040214539},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48450562357902527},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48077934980392456},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.47188273072242737},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.37716376781463623},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3666112422943115},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.17511719465255737},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.1058671772480011},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.07385805249214172},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.07016444206237793},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C182310444","wikidata":"https://www.wikidata.org/wiki/Q1332643","display_name":"Boundary value problem","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s00357-024-09480-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00357-024-09480-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00357-024-09480-4.pdf","source":{"id":"https://openalex.org/S73028643","display_name":"Journal of Classification","issn_l":"0176-4268","issn":["0176-4268","1432-1343"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Classification","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:spr:jclass:v:42:y:2025:i:1:d:10.1007_s00357-024-09480-4","is_oa":false,"landing_page_url":"http://link.springer.com/10.1007/s00357-024-09480-4","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s00357-024-09480-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00357-024-09480-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00357-024-09480-4.pdf","source":{"id":"https://openalex.org/S73028643","display_name":"Journal of Classification","issn_l":"0176-4268","issn":["0176-4268","1432-1343"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Classification","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7111560266","display_name":null,"funder_award_id":"2024-033-STA","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G7641518323","display_name":null,"funder_award_id":"RA201125576565","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G8613244077","display_name":null,"funder_award_id":"SRUG2204203865","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320320692","display_name":"University of Pretoria","ror":"https://ror.org/00g0p6g84"},{"id":"https://openalex.org/F4320322690","display_name":"Universit\u00e0 di Catania","ror":"https://ror.org/03a64bh57"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4400246824.pdf"},"referenced_works_count":49,"referenced_works":["https://openalex.org/W374884248","https://openalex.org/W402407836","https://openalex.org/W571770348","https://openalex.org/W584423923","https://openalex.org/W1598920400","https://openalex.org/W1965342088","https://openalex.org/W2002615595","https://openalex.org/W2005643467","https://openalex.org/W2019470638","https://openalex.org/W2023163585","https://openalex.org/W2029698240","https://openalex.org/W2040052188","https://openalex.org/W2045978762","https://openalex.org/W2049633694","https://openalex.org/W2063690800","https://openalex.org/W2082301243","https://openalex.org/W2082503527","https://openalex.org/W2120323899","https://openalex.org/W2130444042","https://openalex.org/W2137971377","https://openalex.org/W2152594362","https://openalex.org/W2166698530","https://openalex.org/W2168175751","https://openalex.org/W2171074980","https://openalex.org/W2326950840","https://openalex.org/W2461217117","https://openalex.org/W2492307518","https://openalex.org/W2524681876","https://openalex.org/W2796157596","https://openalex.org/W2797746357","https://openalex.org/W2898818720","https://openalex.org/W2904250115","https://openalex.org/W2942670250","https://openalex.org/W2955104602","https://openalex.org/W2963702653","https://openalex.org/W2999527243","https://openalex.org/W3000212246","https://openalex.org/W3014839920","https://openalex.org/W3040917674","https://openalex.org/W3174357322","https://openalex.org/W3197481465","https://openalex.org/W4200633511","https://openalex.org/W4235169531","https://openalex.org/W4236654676","https://openalex.org/W4243269039","https://openalex.org/W4253803149","https://openalex.org/W4280604439","https://openalex.org/W6641757280","https://openalex.org/W6681498133"],"related_works":["https://openalex.org/W3126382579","https://openalex.org/W3107650560","https://openalex.org/W4315588616","https://openalex.org/W4317422773","https://openalex.org/W2810542905","https://openalex.org/W2129350855","https://openalex.org/W2891616219","https://openalex.org/W2796920963","https://openalex.org/W2497860580","https://openalex.org/W3204672119"],"abstract_inverted_index":{"Abstract":[0],"Compositional":[1],"data":[2,123,135],"have":[3],"peculiar":[4],"characteristics":[5],"that":[6,63],"pose":[7],"significant":[8],"challenges":[9],"to":[10,85,124],"traditional":[11],"statistical":[12],"methods":[13],"and":[14,46,93,134,137,150],"models.":[15],"Within":[16],"this":[17],"framework,":[18],"we":[19,34,49,78],"use":[20],"a":[21,56,66],"convenient":[22],"mode":[23],"parametrized":[24],"Dirichlet":[25,40],"distribution":[26,62],"across":[27],"multiple":[28],"fields":[29],"of":[30,38,59,74,82,91,128],"statistics.":[31],"In":[32],"particular,":[33],"propose":[35,79],"finite":[36,80],"mixtures":[37,81],"unimodal":[39],"(UD)":[41],"distributions":[42,84],"for":[43,65,88],"model-based":[44],"clustering":[45],"classification.":[47],"Then,":[48],"introduce":[50],"the":[51,60,72,89,97,107,126,151],"contaminated":[52],"UD":[53,61],"(CUD)":[54],"distribution,":[55],"heavy-tailed":[57],"generalization":[58],"allows":[64],"more":[67],"flexible":[68],"tail":[69],"behavior":[70],"in":[71,96],"presence":[73,90],"atypical":[75,94,129],"observations.":[76],"Thirdly,":[77],"CUD":[83],"jointly":[86],"account":[87],"clusters":[92],"points":[95],"data.":[98],"Parameter":[99],"estimation":[100,133],"is":[101],"carried":[102],"out":[103],"by":[104,111],"directly":[105],"maximizing":[106],"maximum":[108],"likelihood":[109],"or":[110],"using":[112],"an":[113],"expectation-maximization":[114],"(EM)":[115],"algorithm.":[116],"Two":[117],"analyses":[118],"are":[119,148,157],"conducted":[120],"on":[121,131],"simulated":[122],"illustrate":[125],"effects":[127],"observations":[130],"parameter":[132],"classification,":[136],"how":[138],"our":[139,155],"proposals":[140],"address":[141],"both":[142],"aspects.":[143],"Furthermore,":[144],"two":[145],"real":[146],"datasets":[147],"investigated":[149],"results":[152],"obtained":[153],"via":[154],"models":[156],"discussed.":[158]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-10-10T00:00:00"}
