{"id":"https://openalex.org/W2149373142","doi":"https://doi.org/10.1186/s40537-015-0027-y","title":"A novel algorithm for fast and scalable subspace clustering of high-dimensional data","display_name":"A novel algorithm for fast and scalable subspace clustering of high-dimensional data","publication_year":2015,"publication_date":"2015-08-11","ids":{"openalex":"https://openalex.org/W2149373142","doi":"https://doi.org/10.1186/s40537-015-0027-y","mag":"2149373142"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-015-0027-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-015-0027-y","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-015-0027-y","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-015-0027-y","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101549768","display_name":"Amardeep Kaur","orcid":"https://orcid.org/0000-0002-0317-5303"},"institutions":[{"id":"https://openalex.org/I177877127","display_name":"The University of Western Australia","ror":"https://ror.org/047272k79","country_code":"AU","type":"education","lineage":["https://openalex.org/I177877127"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Amardeep Kaur","raw_affiliation_strings":["School of Computer Science and Software Engineering, University of Western Australia, Stirling Highway, 6009, Perth, Australia"],"raw_orcid":"https://orcid.org/0000-0002-0317-5303","affiliations":[{"raw_affiliation_string":"School of Computer Science and Software Engineering, University of Western Australia, Stirling Highway, 6009, Perth, Australia","institution_ids":["https://openalex.org/I177877127"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005705210","display_name":"Amitava Datta","orcid":"https://orcid.org/0000-0001-6916-7907"},"institutions":[{"id":"https://openalex.org/I177877127","display_name":"The University of Western Australia","ror":"https://ror.org/047272k79","country_code":"AU","type":"education","lineage":["https://openalex.org/I177877127"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Amitava Datta","raw_affiliation_strings":["School of Computer Science and Software Engineering, University of Western Australia, Stirling Highway, 6009, Perth, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Software Engineering, University of Western Australia, Stirling Highway, 6009, Perth, Australia","institution_ids":["https://openalex.org/I177877127"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101549768"],"corresponding_institution_ids":["https://openalex.org/I177877127"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":6.677,"has_fulltext":true,"cited_by_count":39,"citation_normalized_percentile":{"value":0.96744312,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"2","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8362753391265869},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7413142323493958},{"id":"https://openalex.org/keywords/linear-subspace","display_name":"Linear subspace","score":0.7353991866111755},{"id":"https://openalex.org/keywords/clustering-high-dimensional-data","display_name":"Clustering high-dimensional data","score":0.7181884050369263},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.6100406050682068},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6059072017669678},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.603799045085907},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.5945252776145935},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.49761584401130676},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.4644038677215576},{"id":"https://openalex.org/keywords/data-point","display_name":"Data point","score":0.43426191806793213},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.433065265417099},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.42254793643951416},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.41127318143844604},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4022625684738159},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34993964433670044},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19474530220031738},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.1637800633907318}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8362753391265869},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7413142323493958},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.7353991866111755},{"id":"https://openalex.org/C184509293","wikidata":"https://www.wikidata.org/wiki/Q5136711","display_name":"Clustering high-dimensional data","level":3,"score":0.7181884050369263},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.6100406050682068},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6059072017669678},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.603799045085907},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.5945252776145935},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.49761584401130676},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.4644038677215576},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.43426191806793213},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.433065265417099},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.42254793643951416},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41127318143844604},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4022625684738159},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34993964433670044},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19474530220031738},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.1637800633907318},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1186/s40537-015-0027-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-015-0027-y","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-015-0027-y","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:pure.atira.dk:openaire/569403ea-4587-42f3-bb5d-95cfc17817ec","is_oa":true,"landing_page_url":"https://admin.research-repository.uwa.edu.au/en/publications/569403ea-4587-42f3-bb5d-95cfc17817ec","pdf_url":null,"source":{"id":"https://openalex.org/S4306402492","display_name":"UWA Profiles and Research Repository (UWA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I177877127","host_organization_name":"The University of Western Australia","host_organization_lineage":["https://openalex.org/I177877127"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Kaur, A & Datta, A 2015, 'A novel algorithm for fast and scalable subspace clustering of high-dimensional data', Journal of Big Data, vol. 2, no. 17, pp. 1-24. https://doi.org/10.1186/s40537-015-0027-y","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.atira.dk:publications/569403ea-4587-42f3-bb5d-95cfc17817ec","is_oa":true,"landing_page_url":"https://research-repository.uwa.edu.au/en/publications/569403ea-4587-42f3-bb5d-95cfc17817ec","pdf_url":null,"source":{"id":"https://openalex.org/S4306402523","display_name":"UWA Profiles and Research Repository (University of Western Australia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I177877127","host_organization_name":"The University of Western Australia","host_organization_lineage":["https://openalex.org/I177877127"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Kaur , A &amp; Datta , A 2015 , ' A novel algorithm for fast and scalable subspace clustering of high-dimensional data ' , Journal of Big Data , vol. 2 , no. 17 , pp. 1-24 . https://doi.org/10.1186/s40537-015-0027-y","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-015-0027-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-015-0027-y","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-015-0027-y","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320315885","display_name":"Australian Government","ror":"https://ror.org/0314h5y94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2149373142.pdf","grobid_xml":"https://content.openalex.org/works/W2149373142.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W180521011","https://openalex.org/W191006456","https://openalex.org/W1493217831","https://openalex.org/W1507901999","https://openalex.org/W1531910981","https://openalex.org/W1550603695","https://openalex.org/W1553696291","https://openalex.org/W1562753845","https://openalex.org/W1599794708","https://openalex.org/W1672197616","https://openalex.org/W1673310716","https://openalex.org/W1968201280","https://openalex.org/W1977496278","https://openalex.org/W1979538862","https://openalex.org/W1993962865","https://openalex.org/W1999705173","https://openalex.org/W2005799462","https://openalex.org/W2006533296","https://openalex.org/W2042035594","https://openalex.org/W2056639756","https://openalex.org/W2065811242","https://openalex.org/W2079361215","https://openalex.org/W2080816440","https://openalex.org/W2095897464","https://openalex.org/W2101234009","https://openalex.org/W2105877777","https://openalex.org/W2109130989","https://openalex.org/W2109464129","https://openalex.org/W2109746343","https://openalex.org/W2114060717","https://openalex.org/W2115579991","https://openalex.org/W2116324873","https://openalex.org/W2116838486","https://openalex.org/W2117355841","https://openalex.org/W2118258530","https://openalex.org/W2125742596","https://openalex.org/W2133990480","https://openalex.org/W2138745909","https://openalex.org/W2140942285","https://openalex.org/W2141012957","https://openalex.org/W2150926065","https://openalex.org/W2153233077","https://openalex.org/W2155010807","https://openalex.org/W2159633885","https://openalex.org/W2165916500","https://openalex.org/W2167091752","https://openalex.org/W2169387435","https://openalex.org/W2171029115","https://openalex.org/W2188351697","https://openalex.org/W2189948602","https://openalex.org/W2230939080","https://openalex.org/W2294644361","https://openalex.org/W2500846359","https://openalex.org/W2549056440","https://openalex.org/W3120740533","https://openalex.org/W4213009331","https://openalex.org/W4237171445","https://openalex.org/W4248058040","https://openalex.org/W4250446904","https://openalex.org/W4250657332","https://openalex.org/W4254311734","https://openalex.org/W4285719527","https://openalex.org/W6600686112"],"related_works":["https://openalex.org/W4301002638","https://openalex.org/W2606552659","https://openalex.org/W2111119584","https://openalex.org/W3186815950","https://openalex.org/W3088133960","https://openalex.org/W2163563073","https://openalex.org/W2921708367","https://openalex.org/W2001483765","https://openalex.org/W2590117803","https://openalex.org/W2607902515"],"abstract_inverted_index":{"Rapid":[0],"growth":[1,91],"of":[2,24,28,35,40,65,95,101,107,167,183,186,198,248,259],"high":[3,47],"dimensional":[4,48,152,158],"datasets":[5,49],"in":[6,32,45,80,92,125,180,266],"recent":[7],"years":[8],"has":[9],"created":[10],"an":[11,51],"emergent":[12],"need":[13],"to":[14,147,220],"extract":[15],"the":[16,22,33,36,46,89,93,99,104,156,165,168,178,181,207,246,249,257,260],"knowledge":[17],"underlying":[18],"them.":[19],"Clustering":[20],"is":[21,50,114,143,252],"process":[23,84,106],"automatically":[25],"finding":[26],"groups":[27],"similar":[29],"data":[30,55,102,128,238],"points":[31],"space":[34],"dimensions":[37],"or":[38,204],"attributes":[39],"a":[41,71,83,115,144,161,195,216,236],"dataset.":[42],"Finding":[43],"clusters":[44,154,159,224],"important":[52],"and":[53,120,136,193,228,251,263],"challenging":[54],"mining":[56],"problem.":[57],"Data":[58],"group":[59],"together":[60],"differently":[61],"under":[62],"different":[63],"subsets":[64],"dimensions,":[66],"called":[67,85],"subspaces.":[68],"Quite":[69],"often":[70],"dataset":[72,250],"can":[73],"be":[74],"better":[75],"understood":[76],"by":[77],"clustering":[78,109,123,142,208,218],"it":[79,229],"its":[81,264],"subspaces,":[82],"subspace":[86,108,122,153,200,223],"clustering.":[87],"But":[88],"exponential":[90],"number":[94,182,197],"these":[96,187],"subspaces":[97],"with":[98,177,225,245],"dimensionality":[100,247],"makes":[103],"whole":[105],"computationally":[110],"very":[111,243],"expensive.":[112],"There":[113],"growing":[116],"demand":[117],"for":[118,235],"efficient":[119],"scalable":[121],"solutions":[124],"many":[126],"Big":[127],"application":[129],"domains":[130],"like":[131],"biology,":[132],"computer":[133],"vision,":[134],"astronomy":[135],"social":[137],"networking.":[138],"Apriori":[139],"based":[140,171],"hierarchical":[141],"promising":[145],"approach":[146,174],"find":[148,221],"all":[149],"possible":[150],"higher":[151],"from":[155],"lower":[157],"using":[160],"bottom-up":[162],"process.":[163,209],"However,":[164],"performance":[166],"existing":[169],"algorithms":[170,188],"on":[172],"this":[173,211,267],"deteriorates":[175],"drastically":[176],"increase":[179],"dimensions.":[184],"Most":[185],"require":[189],"multiple":[190],"database":[191,233],"scans":[192,234],"generate":[194],"large":[196],"redundant":[199],"clusters,":[201],"either":[202],"implicitly":[203],"explicitly,":[205],"during":[206],"In":[210],"paper,":[212],"we":[213],"present":[214,256],"SUBSCALE,":[215],"novel":[217],"algorithm":[219,241,262],"non-trivial":[222],"minimal":[226],"cost":[227],"requires":[230],"only":[231],"k":[232],"k-dimensional":[237],"set.":[239],"Our":[240],"scales":[242],"well":[244],"highly":[253],"parallelizable.":[254],"We":[255],"details":[258],"SUBSCALE":[261],"evaluation":[265],"paper.":[268]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
