{"id":"https://openalex.org/W2571274719","doi":"https://doi.org/10.5220/0004828202550262","title":"Kernel Hierarchical Agglomerative Clustering - Comparison of Different Gap Statistics to Estimate the Number of Clusters","display_name":"Kernel Hierarchical Agglomerative Clustering - Comparison of Different Gap Statistics to Estimate the Number of Clusters","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2571274719","doi":"https://doi.org/10.5220/0004828202550262","mag":"2571274719"},"language":"en","primary_location":{"id":"doi:10.5220/0004828202550262","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0004828202550262","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd International Conference on Pattern Recognition Applications and Methods","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0004828202550262","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100368048","display_name":"Na Li","orcid":"https://orcid.org/0000-0001-9545-3050"},"institutions":[{"id":"https://openalex.org/I140494188","display_name":"Universit\u00e9 de Technologie de Troyes","ror":"https://ror.org/01qhqcj41","country_code":"FR","type":"education","lineage":["https://openalex.org/I140494188"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Na Li","raw_affiliation_strings":["LM2S - Laboratoire Mod\u00e9lisation et S\u00fbret\u00e9 des Syst\u00e8mes (UTT - 12, rue Marie Curie - BP 2060 - 10010 TROYES CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LM2S - Laboratoire Mod\u00e9lisation et S\u00fbret\u00e9 des Syst\u00e8mes (UTT - 12, rue Marie Curie - BP 2060 - 10010 TROYES CEDEX - France)","institution_ids":["https://openalex.org/I140494188"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029849846","display_name":"Nicolas Lef\u00e8bvre","orcid":null},"institutions":[{"id":"https://openalex.org/I140494188","display_name":"Universit\u00e9 de Technologie de Troyes","ror":"https://ror.org/01qhqcj41","country_code":"FR","type":"education","lineage":["https://openalex.org/I140494188"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Nicolas Lefebvre","raw_affiliation_strings":["LM2S - Laboratoire Mod\u00e9lisation et S\u00fbret\u00e9 des Syst\u00e8mes (UTT - 12, rue Marie Curie - BP 2060 - 10010 TROYES CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LM2S - Laboratoire Mod\u00e9lisation et S\u00fbret\u00e9 des Syst\u00e8mes (UTT - 12, rue Marie Curie - BP 2060 - 10010 TROYES CEDEX - France)","institution_ids":["https://openalex.org/I140494188"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087789216","display_name":"R\u00e9gis Lengelle","orcid":"https://orcid.org/0000-0002-3538-3799"},"institutions":[{"id":"https://openalex.org/I140494188","display_name":"Universit\u00e9 de Technologie de Troyes","ror":"https://ror.org/01qhqcj41","country_code":"FR","type":"education","lineage":["https://openalex.org/I140494188"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"R\u00e9gis Lengell\u00e9","raw_affiliation_strings":["LM2S - Laboratoire Mod\u00e9lisation et S\u00fbret\u00e9 des Syst\u00e8mes (UTT - 12, rue Marie Curie - BP 2060 - 10010 TROYES CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LM2S - Laboratoire Mod\u00e9lisation et S\u00fbret\u00e9 des Syst\u00e8mes (UTT - 12, rue Marie Curie - BP 2060 - 10010 TROYES CEDEX - France)","institution_ids":["https://openalex.org/I140494188"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4229,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.7859041,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"255","last_page":"262"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9835000038146973,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7614426612854004},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.6915422677993774},{"id":"https://openalex.org/keywords/dendrogram","display_name":"Dendrogram","score":0.6612372398376465},{"id":"https://openalex.org/keywords/brown-clustering","display_name":"Brown clustering","score":0.6515339016914368},{"id":"https://openalex.org/keywords/hierarchical-clustering-of-networks","display_name":"Hierarchical clustering of networks","score":0.6032209992408752},{"id":"https://openalex.org/keywords/single-linkage-clustering","display_name":"Single-linkage clustering","score":0.5938873887062073},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5809715986251831},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.48236483335494995},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4794141948223114},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.46771755814552307},{"id":"https://openalex.org/keywords/statistic","display_name":"Statistic","score":0.46716487407684326},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4484920799732208},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.44345614314079285},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4131774306297302},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.38967445492744446},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.26440995931625366}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7614426612854004},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.6915422677993774},{"id":"https://openalex.org/C172312944","wikidata":"https://www.wikidata.org/wiki/Q1957903","display_name":"Dendrogram","level":4,"score":0.6612372398376465},{"id":"https://openalex.org/C167984511","wikidata":"https://www.wikidata.org/wiki/Q17003931","display_name":"Brown clustering","level":5,"score":0.6515339016914368},{"id":"https://openalex.org/C82261393","wikidata":"https://www.wikidata.org/wiki/Q17038699","display_name":"Hierarchical clustering of networks","level":5,"score":0.6032209992408752},{"id":"https://openalex.org/C22648726","wikidata":"https://www.wikidata.org/wiki/Q7523744","display_name":"Single-linkage clustering","level":5,"score":0.5938873887062073},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5809715986251831},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.48236483335494995},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4794141948223114},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.46771755814552307},{"id":"https://openalex.org/C89128539","wikidata":"https://www.wikidata.org/wiki/Q1949963","display_name":"Statistic","level":2,"score":0.46716487407684326},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4484920799732208},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.44345614314079285},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4131774306297302},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.38967445492744446},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.26440995931625366},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C81977670","wikidata":"https://www.wikidata.org/wiki/Q585259","display_name":"Genetic diversity","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5220/0004828202550262","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0004828202550262","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd International Conference on Pattern Recognition Applications and Methods","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.5220/0004828202550262","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0004828202550262","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd International Conference on Pattern Recognition Applications and Methods","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2488882714","https://openalex.org/W1602287844","https://openalex.org/W2384052049","https://openalex.org/W2062059194","https://openalex.org/W2385630304","https://openalex.org/W4241767317","https://openalex.org/W2087424554","https://openalex.org/W1957537378","https://openalex.org/W2367205823","https://openalex.org/W4220814143"],"abstract_inverted_index":{"Clustering":[0],"algorithms,":[1],"as":[2],"unsupervised":[3],"analysis":[4],"tools,":[5],"are":[6],"useful":[7],"for":[8],"exploring":[9],"data":[10,53],"structure":[11],"and":[12,36,72,88],"have":[13],"owned\r\n\r\ngreat":[14],"success":[15],"in":[16],"many":[17],"disciplines.":[18],"For":[19],"most":[20,41],"of":[21,39,50,76,86,111,113,122],"the":[22,28,30,40,48,56,69,74,84,89,109,119,123],"clustering":[23,60],"algorithms":[24],"like":[25],"k-means,":[26],"determining":[27],"number\r\n\r\nof":[29],"clusters":[31,87],"is":[32,37],"a":[33,52],"crucial":[34],"step":[35],"one":[38],"difficult":[42],"problems.":[43],"Hierarchical":[44,125],"Agglomerative":[45],"Clustering\r\n\r\n(HAC)":[46],"has":[47,94],"advantage":[49],"giving":[51],"representation":[54],"by":[55,61,92],"dendrogram":[57,63],"that":[58],"allows":[59],"cutting\r\n\r\nthe":[62],"at":[64],"some":[65,102],"optimal":[66],"level.":[67],"In":[68,97],"past":[70],"years":[71],"within":[73],"context":[75],"HAC,":[77],"efficient":[78],"statistics":[79],"have\r\n\r\nbeen":[80],"proposed":[81],"to":[82,106],"estimate":[83],"number":[85],"Gap":[90,104],"Statistic":[91],"Tibshirani":[93],"shown":[95],"interesting\r\n\r\nperformances.":[96],"this":[98],"paper,":[99],"we":[100],"propose":[101],"new":[103],"Statistics":[105],"further":[107],"improve":[108],"determination":[110],"the\r\n\r\nnumber":[112],"clusters.":[114],"Our":[115],"works":[116],"focus":[117],"on":[118],"kernelized":[120],"version":[121],"widely-used":[124],"Clustering\r\n\r\nAlgorithm.":[126]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2017-01-13T00:00:00"}
