{"id":"https://openalex.org/W2524305182","doi":"https://doi.org/10.1109/tnnls.2016.2608354","title":"Cluster Validation Method for Determining the Number of Clusters in Categorical Sequences","display_name":"Cluster Validation Method for Determining the Number of Clusters in Categorical Sequences","publication_year":2016,"publication_date":"2016-09-27","ids":{"openalex":"https://openalex.org/W2524305182","doi":"https://doi.org/10.1109/tnnls.2016.2608354","mag":"2524305182","pmid":"https://pubmed.ncbi.nlm.nih.gov/28114078"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2016.2608354","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2016.2608354","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101637886","display_name":"Gongde Guo","orcid":"https://orcid.org/0000-0002-5118-7261"},"institutions":[{"id":"https://openalex.org/I111753288","display_name":"Fujian Normal University","ror":"https://ror.org/020azk594","country_code":"CN","type":"education","lineage":["https://openalex.org/I111753288"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gongde Guo","raw_affiliation_strings":["School of Mathematics and Computer Science, Fujian Normal University, Fuzhou China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics and Computer Science, Fujian Normal University, Fuzhou China","institution_ids":["https://openalex.org/I111753288"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091369584","display_name":"Lifei Chen","orcid":"https://orcid.org/0000-0003-3568-8899"},"institutions":[{"id":"https://openalex.org/I111753288","display_name":"Fujian Normal University","ror":"https://ror.org/020azk594","country_code":"CN","type":"education","lineage":["https://openalex.org/I111753288"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lifei Chen","raw_affiliation_strings":["School of Mathematics and Computer Science, Fujian Normal University, Fuzhou China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics and Computer Science, Fujian Normal University, Fuzhou China","institution_ids":["https://openalex.org/I111753288"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101586436","display_name":"Yanfang Ye","orcid":"https://orcid.org/0000-0001-8376-7239"},"institutions":[{"id":"https://openalex.org/I12097938","display_name":"West Virginia University","ror":"https://ror.org/011vxgd24","country_code":"US","type":"education","lineage":["https://openalex.org/I12097938"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanfang Ye","raw_affiliation_strings":["Lane Department of Computer Science and Electrical Engineering , West Virginia University , Morgantown , WV , USA"],"affiliations":[{"raw_affiliation_string":"Lane Department of Computer Science and Electrical Engineering , West Virginia University , Morgantown , WV , USA","institution_ids":["https://openalex.org/I12097938"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052377100","display_name":"Qingshan Jiang","orcid":"https://orcid.org/0000-0002-8040-0308"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingshan Jiang","raw_affiliation_strings":["Shenzhen Key Laboratory for High Performance Data Mining, Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Key Laboratory for High Performance Data Mining, Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101637886"],"corresponding_institution_ids":["https://openalex.org/I111753288"],"apc_list":null,"apc_paid":null,"fwci":3.0484,"has_fulltext":false,"cited_by_count":48,"citation_normalized_percentile":{"value":0.91657036,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"28","issue":"12","first_page":"2936","last_page":"2948"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.7789358496665955},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7781134843826294},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.6463296413421631},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5973129272460938},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5890712738037109},{"id":"https://openalex.org/keywords/determining-the-number-of-clusters-in-a-data-set","display_name":"Determining the number of clusters in a data set","score":0.471680223941803},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.46314287185668945},{"id":"https://openalex.org/keywords/single-linkage-clustering","display_name":"Single-linkage clustering","score":0.4554121792316437},{"id":"https://openalex.org/keywords/fuzzy-clustering","display_name":"Fuzzy clustering","score":0.4520539939403534},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.4488162100315094},{"id":"https://openalex.org/keywords/consensus-clustering","display_name":"Consensus clustering","score":0.4397290349006653},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4260023236274719},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42390257120132446},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.32466787099838257},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.27876657247543335},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2766833007335663}],"concepts":[{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.7789358496665955},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7781134843826294},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.6463296413421631},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5973129272460938},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5890712738037109},{"id":"https://openalex.org/C149872217","wikidata":"https://www.wikidata.org/wiki/Q5265701","display_name":"Determining the number of clusters in a data set","level":5,"score":0.471680223941803},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.46314287185668945},{"id":"https://openalex.org/C22648726","wikidata":"https://www.wikidata.org/wiki/Q7523744","display_name":"Single-linkage clustering","level":5,"score":0.4554121792316437},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.4520539939403534},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.4488162100315094},{"id":"https://openalex.org/C186767784","wikidata":"https://www.wikidata.org/wiki/Q5162841","display_name":"Consensus clustering","level":5,"score":0.4397290349006653},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4260023236274719},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42390257120132446},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.32466787099838257},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.27876657247543335},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2766833007335663},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2016.2608354","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2016.2608354","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:28114078","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/28114078","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3115418889","display_name":null,"funder_award_id":"2015J01238","funder_id":"https://openalex.org/F4320321878","funder_display_name":"Natural Science Foundation of Fujian Province"},{"id":"https://openalex.org/G32186264","display_name":null,"funder_award_id":"61175123","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6189876786","display_name":null,"funder_award_id":"CNS-1618629","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6925082703","display_name":null,"funder_award_id":"61672157","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321878","display_name":"Natural Science Foundation of Fujian Province","ror":null},{"id":"https://openalex.org/F4320321935","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W8488631","https://openalex.org/W70833783","https://openalex.org/W286152367","https://openalex.org/W845171161","https://openalex.org/W1536018596","https://openalex.org/W1585610988","https://openalex.org/W1673310716","https://openalex.org/W1973243276","https://openalex.org/W1974364887","https://openalex.org/W1978176329","https://openalex.org/W1987971958","https://openalex.org/W1990368529","https://openalex.org/W1996747841","https://openalex.org/W2008711923","https://openalex.org/W2009435671","https://openalex.org/W2032227337","https://openalex.org/W2032345031","https://openalex.org/W2043793719","https://openalex.org/W2047191928","https://openalex.org/W2051224630","https://openalex.org/W2085487226","https://openalex.org/W2102177745","https://openalex.org/W2107402227","https://openalex.org/W2108122721","https://openalex.org/W2113859276","https://openalex.org/W2115077250","https://openalex.org/W2116324873","https://openalex.org/W2116442055","https://openalex.org/W2119894516","https://openalex.org/W2122051577","https://openalex.org/W2125779688","https://openalex.org/W2126626732","https://openalex.org/W2142318161","https://openalex.org/W2142635246","https://openalex.org/W2148425841","https://openalex.org/W2148900457","https://openalex.org/W2153233077","https://openalex.org/W2155422470","https://openalex.org/W2156606946","https://openalex.org/W2157305948","https://openalex.org/W2163993443","https://openalex.org/W2166647826","https://openalex.org/W2168175751","https://openalex.org/W2171963266","https://openalex.org/W2319660501","https://openalex.org/W2338257905","https://openalex.org/W2395916081","https://openalex.org/W4231339208","https://openalex.org/W6602877399","https://openalex.org/W6635035540","https://openalex.org/W6637131181","https://openalex.org/W6675941702"],"related_works":["https://openalex.org/W2129417512","https://openalex.org/W2406185607","https://openalex.org/W2141140100","https://openalex.org/W4230135178","https://openalex.org/W2982243238","https://openalex.org/W4231226332","https://openalex.org/W2263992973","https://openalex.org/W2371540751","https://openalex.org/W2146121510","https://openalex.org/W2067418549"],"abstract_inverted_index":{"Cluster":[0],"validation,":[1],"which":[2,41,137],"is":[3,65,100,134],"the":[4,8,53,70,81,108,120,139,147,151,166,172,179,196,211,214],"process":[5],"of":[6,10,62,72,105,122,131,153,181,213],"evaluating":[7],"quality":[9,121],"clustering":[11,64,130,144,163],"results,":[12],"plays":[13],"an":[14,73,157],"important":[15],"role":[16],"for":[17,57,128],"practical":[18],"machine":[19],"learning":[20],"systems.":[21],"Categorical":[22],"sequences,":[23],"such":[24],"as":[25,102],"biological":[26],"sequences":[27,63,133,194],"in":[28,34,47,85,91,183],"computational":[29],"biology,":[30],"have":[31],"become":[32],"common":[33,173],"real-world":[35,201],"applications.":[36],"Different":[37],"from":[38,204],"previous":[39],"studies,":[40],"mainly":[42],"focused":[43],"on":[44,52,190,199],"attribute-value":[45],"data,":[46],"this":[48,89,92],"paper,":[49,93],"we":[50],"work":[51],"cluster":[54,96],"validation":[55,75],"problem":[56],"categorical":[58,132,184],"sequences.":[59,86],"The":[60,161],"evaluation":[61],"currently":[66],"difficult":[67],"due":[68],"to":[69,80,118,177,209],"lack":[71],"internal":[74],"criterion":[76],"defined":[77],"with":[78,107,142],"regard":[79],"structural":[82,110,114],"features":[83],"hidden":[84],"To":[87],"solve":[88],"problem,":[90],"a":[94,103],"novel":[95],"validity":[97],"index":[98],"(CVI)":[99],"proposed":[101,215],"function":[104],"clustering,":[106],"intracluster":[109],"compactness":[111],"and":[112,150,165,195],"intercluster":[113],"separation":[115],"linearly":[116],"combined":[117],"measure":[119,141],"sequence":[123,185,202],"clusters.":[124],"A":[125,187],"partition-based":[126],"algorithm":[127,164],"robust":[129],"also":[135],"proposed,":[136],"provides":[138],"new":[140,162],"high-quality":[143],"results":[145,198],"by":[146],"deterministic":[148],"initialization":[149],"elimination":[152],"noise":[154],"clusters":[155,182],"using":[156],"information":[158],"theoretic":[159],"method.":[160,216],"CVI":[167],"are":[168,207],"then":[169],"assembled":[170],"within":[171],"model":[174],"selection":[175],"procedure":[176],"determine":[178],"number":[180],"sets.":[186],"case":[188],"study":[189],"commonly":[191],"used":[192],"protein":[193],"experimental":[197],"some":[200],"sets":[203],"different":[205],"domains":[206],"given":[208],"demonstrate":[210],"performance":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":2}],"updated_date":"2026-03-04T09:10:02.777135","created_date":"2025-10-10T00:00:00"}
