{"id":"https://openalex.org/W2082888943","doi":"https://doi.org/10.3390/e17031535","title":"Clustering Heterogeneous Data with k-Means by Mutual Information-Based Unsupervised Feature Transformation","display_name":"Clustering Heterogeneous Data with k-Means by Mutual Information-Based Unsupervised Feature Transformation","publication_year":2015,"publication_date":"2015-03-23","ids":{"openalex":"https://openalex.org/W2082888943","doi":"https://doi.org/10.3390/e17031535","mag":"2082888943"},"language":"en","primary_location":{"id":"doi:10.3390/e17031535","is_oa":true,"landing_page_url":"https://doi.org/10.3390/e17031535","pdf_url":"https://www.mdpi.com/1099-4300/17/3/1535/pdf?version=1427106763","source":{"id":"https://openalex.org/S195231649","display_name":"Entropy","issn_l":"1099-4300","issn":["1099-4300"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Entropy","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/1099-4300/17/3/1535/pdf?version=1427106763","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015600800","display_name":"Min Wei","orcid":"https://orcid.org/0000-0003-4005-1331"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Min Wei","raw_affiliation_strings":["Department of Electronic Engineering, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050716572","display_name":"Tommy W. S. Chow","orcid":"https://orcid.org/0000-0001-7051-0434"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Tommy Chow","raw_affiliation_strings":["Department of Electronic Engineering, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010836514","display_name":"Rosa H. M. Chan","orcid":"https://orcid.org/0000-0003-4808-2490"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Rosa Chan","raw_affiliation_strings":["Department of Electronic Engineering, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5015600800"],"corresponding_institution_ids":["https://openalex.org/I168719708"],"apc_list":{"value":2000,"currency":"CHF","value_usd":2165},"apc_paid":{"value":2000,"currency":"CHF","value_usd":2165},"fwci":3.5607,"has_fulltext":true,"cited_by_count":31,"citation_normalized_percentile":{"value":0.93633307,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"17","issue":"3","first_page":"1535","last_page":"1548"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8023102879524231},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.558239758014679},{"id":"https://openalex.org/keywords/hamming-distance","display_name":"Hamming distance","score":0.5188756585121155},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4834514558315277},{"id":"https://openalex.org/keywords/centroid","display_name":"Centroid","score":0.47974956035614014},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.4628303349018097},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.45537763833999634},{"id":"https://openalex.org/keywords/numerical-analysis","display_name":"Numerical analysis","score":0.45478782057762146},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.45421987771987915},{"id":"https://openalex.org/keywords/euclidean-distance","display_name":"Euclidean distance","score":0.4454249441623688},{"id":"https://openalex.org/keywords/hamming-code","display_name":"Hamming code","score":0.4418484568595886},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.44176286458969116},{"id":"https://openalex.org/keywords/clustering-high-dimensional-data","display_name":"Clustering high-dimensional data","score":0.4399029016494751},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4115096628665924},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3763558268547058}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8023102879524231},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.558239758014679},{"id":"https://openalex.org/C193319292","wikidata":"https://www.wikidata.org/wiki/Q272172","display_name":"Hamming distance","level":2,"score":0.5188756585121155},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4834514558315277},{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.47974956035614014},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.4628303349018097},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.45537763833999634},{"id":"https://openalex.org/C48753275","wikidata":"https://www.wikidata.org/wiki/Q11216","display_name":"Numerical analysis","level":2,"score":0.45478782057762146},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.45421987771987915},{"id":"https://openalex.org/C120174047","wikidata":"https://www.wikidata.org/wiki/Q847073","display_name":"Euclidean distance","level":2,"score":0.4454249441623688},{"id":"https://openalex.org/C73150493","wikidata":"https://www.wikidata.org/wiki/Q853922","display_name":"Hamming code","level":4,"score":0.4418484568595886},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.44176286458969116},{"id":"https://openalex.org/C184509293","wikidata":"https://www.wikidata.org/wiki/Q5136711","display_name":"Clustering high-dimensional data","level":3,"score":0.4399029016494751},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4115096628665924},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3763558268547058},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C157125643","wikidata":"https://www.wikidata.org/wiki/Q884707","display_name":"Block code","level":3,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/e17031535","is_oa":true,"landing_page_url":"https://doi.org/10.3390/e17031535","pdf_url":"https://www.mdpi.com/1099-4300/17/3/1535/pdf?version=1427106763","source":{"id":"https://openalex.org/S195231649","display_name":"Entropy","issn_l":"1099-4300","issn":["1099-4300"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Entropy","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:5466143994154ec7bfda375da9b9f934","is_oa":true,"landing_page_url":"https://doaj.org/article/5466143994154ec7bfda375da9b9f934","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Entropy, Vol 17, Iss 3, Pp 1535-1548 (2015)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/1099-4300/17/3/1535/","is_oa":true,"landing_page_url":"http://dx.doi.org/10.3390/e17031535","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Entropy","raw_type":"Text"},{"id":"pmh:oai:pure.atira.dk:publications/8731773b-4aeb-412e-9171-1b069515e135","is_oa":true,"landing_page_url":"https://hdl.handle.net/2031/8731773b-4aeb-412e-9171-1b069515e135","pdf_url":null,"source":{"id":"https://openalex.org/S7407055387","display_name":"CityU Scholars","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Wei, M, Chow, T W S & Chan, R H M 2015, 'Clustering Heterogeneous Data with k-Means by Mutual Information-Based Unsupervised Feature Transformation', Entropy, vol. 17, no. 3, pp. 1535 - 1548. https://doi.org/10.3390/e17031535","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.3390/e17031535","is_oa":true,"landing_page_url":"https://doi.org/10.3390/e17031535","pdf_url":"https://www.mdpi.com/1099-4300/17/3/1535/pdf?version=1427106763","source":{"id":"https://openalex.org/S195231649","display_name":"Entropy","issn_l":"1099-4300","issn":["1099-4300"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Entropy","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309893","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23"},{"id":"https://openalex.org/F4320320904","display_name":"Croucher Foundation","ror":"https://ror.org/04741mc34"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2082888943.pdf","grobid_xml":"https://content.openalex.org/works/W2082888943.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W114704759","https://openalex.org/W1526441817","https://openalex.org/W1967987265","https://openalex.org/W1972532012","https://openalex.org/W1974209792","https://openalex.org/W1988387273","https://openalex.org/W1992402718","https://openalex.org/W1996344812","https://openalex.org/W1999071271","https://openalex.org/W2034182200","https://openalex.org/W2073459066","https://openalex.org/W2076331049","https://openalex.org/W2094014879","https://openalex.org/W2095897464","https://openalex.org/W2109622481","https://openalex.org/W2122943553","https://openalex.org/W2127218421","https://openalex.org/W2127971792","https://openalex.org/W2131687179","https://openalex.org/W2144357229","https://openalex.org/W2149230623","https://openalex.org/W2162151748","https://openalex.org/W3120740533","https://openalex.org/W3121403162","https://openalex.org/W4234556776","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2788671511","https://openalex.org/W4200482842","https://openalex.org/W3208326136","https://openalex.org/W2406932278","https://openalex.org/W2045437074","https://openalex.org/W2546959060","https://openalex.org/W2018402912","https://openalex.org/W2032989665","https://openalex.org/W4226101389","https://openalex.org/W2773760320"],"abstract_inverted_index":{"Traditional":[0],"centroid-based":[1],"clustering":[2,127],"algorithms":[3],"for":[4,26,82,131],"heterogeneous":[5,83,132],"data":[6,84,133],"with":[7,77,134],"numerical":[8,70,94,136],"and":[9,40,50,105,117,137],"non-numerical":[10,30,67,89,103,138],"features":[11,68,71,104],"result":[12],"in":[13],"different":[14,38],"levels":[15],"of":[16,29,100,109,119],"inaccurate":[17],"clustering.":[18,85],"This":[19],"is":[20],"because":[21],"the":[22,47,56,78,87,98,101,107,113,124],"Hamming":[23,51],"distance":[24,49],"used":[25],"dissimilarity":[27],"measurement":[28],"values":[31,95,111],"does":[32],"not":[33],"provide":[34,93],"optimal":[35],"distances":[36],"between":[37],"values,":[39],"problems":[41],"arise":[42],"from":[43],"attempts":[44],"to":[45],"combine":[46],"Euclidean":[48],"distance.":[52],"In":[53],"this":[54],"study,":[55],"mutual":[57],"information":[58,73],"(MI)-based":[59],"unsupervised":[60],"feature":[61],"transformation":[62],"(UFT),":[63],"which":[64,96],"can":[65,92],"transform":[66],"into":[69],"without":[72],"loss,":[74],"was":[75],"utilized":[76],"conventional":[79],"k-means":[80],"algorithm":[81,128],"For":[86],"original":[88,102],"features,":[90],"UFT":[91],"preserve":[97],"structure":[99],"have":[106],"property":[108],"continuous":[110],"at":[112],"same":[114],"time.":[115],"Experiments":[116],"analysis":[118],"real-world":[120],"datasets":[121],"showed":[122],"that,":[123],"integrated":[125],"UFT-k-means":[126],"outperformed":[129],"others":[130],"both":[135],"features.":[139]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2}],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2025-10-10T00:00:00"}
