{"id":"https://openalex.org/W1972132022","doi":"https://doi.org/10.1145/1046456.1046468","title":"Subspace clustering for high dimensional categorical data","display_name":"Subspace clustering for high dimensional categorical data","publication_year":2004,"publication_date":"2004-12-01","ids":{"openalex":"https://openalex.org/W1972132022","doi":"https://doi.org/10.1145/1046456.1046468","mag":"1972132022"},"language":"en","primary_location":{"id":"doi:10.1145/1046456.1046468","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1046456.1046468","pdf_url":null,"source":{"id":"https://openalex.org/S4210176598","display_name":"ACM SIGKDD Explorations Newsletter","issn_l":"1931-0145","issn":["1931-0145","1931-0153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGKDD Explorations Newsletter","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000062069","display_name":"Guojun Gan","orcid":"https://orcid.org/0000-0003-3285-7116"},"institutions":[{"id":"https://openalex.org/I192455969","display_name":"York University","ror":"https://ror.org/05fq50484","country_code":"CA","type":"education","lineage":["https://openalex.org/I192455969"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Guojun Gan","raw_affiliation_strings":["York University, Toronto, Canada","York University, Toronto,Canada#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"York University, Toronto, Canada","institution_ids":["https://openalex.org/I192455969"]},{"raw_affiliation_string":"York University, Toronto,Canada#TAB#","institution_ids":["https://openalex.org/I192455969"]}]},{"author_position":"last","author":{"id":null,"display_name":"Jianhong Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I192455969","display_name":"York University","ror":"https://ror.org/05fq50484","country_code":"CA","type":"education","lineage":["https://openalex.org/I192455969"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jianhong Wu","raw_affiliation_strings":["York University, Toronto, Canada","York University, Toronto,Canada#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"York University, Toronto, Canada","institution_ids":["https://openalex.org/I192455969"]},{"raw_affiliation_string":"York University, Toronto,Canada#TAB#","institution_ids":["https://openalex.org/I192455969"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":5.5513,"has_fulltext":false,"cited_by_count":73,"citation_normalized_percentile":{"value":0.95519558,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"6","issue":"2","first_page":"87","last_page":"94"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8456571102142334},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.727140486240387},{"id":"https://openalex.org/keywords/clustering-high-dimensional-data","display_name":"Clustering high-dimensional data","score":0.7081475257873535},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.6406171917915344},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.5715830326080322},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.5563536882400513},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5539290308952332},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.5322152376174927},{"id":"https://openalex.org/keywords/canopy-clustering-algorithm","display_name":"Canopy clustering algorithm","score":0.5014512538909912},{"id":"https://openalex.org/keywords/data-stream-clustering","display_name":"Data stream clustering","score":0.4590934216976166},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.424740731716156},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.39424675703048706},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37214282155036926},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33687666058540344},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.204138845205307}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8456571102142334},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.727140486240387},{"id":"https://openalex.org/C184509293","wikidata":"https://www.wikidata.org/wiki/Q5136711","display_name":"Clustering high-dimensional data","level":3,"score":0.7081475257873535},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.6406171917915344},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.5715830326080322},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.5563536882400513},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5539290308952332},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.5322152376174927},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.5014512538909912},{"id":"https://openalex.org/C193143536","wikidata":"https://www.wikidata.org/wiki/Q5227360","display_name":"Data stream clustering","level":5,"score":0.4590934216976166},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.424740731716156},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39424675703048706},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37214282155036926},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33687666058540344},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.204138845205307},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1046456.1046468","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1046456.1046468","pdf_url":null,"source":{"id":"https://openalex.org/S4210176598","display_name":"ACM SIGKDD Explorations Newsletter","issn_l":"1931-0145","issn":["1931-0145","1931-0153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGKDD Explorations Newsletter","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.108.5225","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.108.5225","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.sigkdd.org/explorations/issues/6-2-2004-12/gan.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1493454437","https://openalex.org/W1592068762","https://openalex.org/W1611682757","https://openalex.org/W1672197616","https://openalex.org/W1971784203","https://openalex.org/W1977496278","https://openalex.org/W1995433152","https://openalex.org/W1999668761","https://openalex.org/W2027002571","https://openalex.org/W2034870679","https://openalex.org/W2042035594","https://openalex.org/W2065811242","https://openalex.org/W2072343647","https://openalex.org/W2080816440","https://openalex.org/W2084812512","https://openalex.org/W2105518356","https://openalex.org/W2112210867","https://openalex.org/W2115116401","https://openalex.org/W2115875363","https://openalex.org/W2118587067","https://openalex.org/W2119885577","https://openalex.org/W2125310307","https://openalex.org/W2131687179","https://openalex.org/W2149230623","https://openalex.org/W2157890661","https://openalex.org/W2212819718","https://openalex.org/W2295428206","https://openalex.org/W2319660501","https://openalex.org/W2505879829","https://openalex.org/W2999729612","https://openalex.org/W4244268470","https://openalex.org/W4254311734","https://openalex.org/W4255446233","https://openalex.org/W6636657728","https://openalex.org/W6677796945","https://openalex.org/W6770641979"],"related_works":["https://openalex.org/W4301002638","https://openalex.org/W2371010743","https://openalex.org/W2163563073","https://openalex.org/W3088133960","https://openalex.org/W1987613674","https://openalex.org/W3186815950","https://openalex.org/W4253632195","https://openalex.org/W2393707058","https://openalex.org/W2590117803","https://openalex.org/W3124860551"],"abstract_inverted_index":{"Data":[0],"clustering":[1,11,32,53],"has":[2],"been":[3],"discussed":[4],"extensively,":[5],"but":[6],"almost":[7],"all":[8],"known":[9],"conventional":[10],"algorithms":[12,33],"tend":[13],"to":[14,86,107,112,126],"break":[15],"down":[16],"in":[17],"high":[18,54],"dimensional":[19,55],"spaces":[20],"because":[21],"of":[22,26,63,98,130],"the":[23,27,61,77,88,114,128,131,135],"inherent":[24],"sparsity":[25],"data":[28,37,57],"points.":[29],"Existing":[30],"subspace":[31,89,115],"for":[34,52,67,105],"handling":[35],"high-dimensional":[36],"focus":[38],"on":[39,60],"numerical":[40],"dimensions.":[41],"In":[42],"this":[43,99],"paper,":[44],"we":[45,121],"designed":[46,82],"an":[47,64,83],"iterative":[48],"algorithm":[49,111],"called":[50],"SUBCAD":[51],"categorical":[56],"sets,":[58],"based":[59],"minimization":[62],"objective":[65,78,84,100],"function":[66,85,101],"clustering.":[68],"We":[69,80,94],"deduced":[70],"some":[71,124],"cluster":[72],"memberships":[73],"changing":[74],"rules":[75],"using":[76],"function.":[79],"also":[81],"determine":[87],"associated":[90,116],"with":[91,117],"each":[92,118],"cluster.":[93,119],"proved":[95],"various":[96],"properties":[97],"that":[102],"are":[103],"essential":[104],"us":[106],"design":[108],"a":[109],"fast":[110],"find":[113],"Finally,":[120],"carried":[122],"out":[123],"experiments":[125],"show":[127],"effectiveness":[129],"proposed":[132],"method":[133],"and":[134],"algorithm.":[136]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":8},{"year":2014,"cited_by_count":9},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
