{"id":"https://openalex.org/W2965184183","doi":"https://doi.org/10.26599/bdma.2018.9020037","title":"A novel clustering technique for efficient clustering of big data in Hadoop Ecosystem","display_name":"A novel clustering technique for efficient clustering of big data in Hadoop Ecosystem","publication_year":2019,"publication_date":"2019-08-05","ids":{"openalex":"https://openalex.org/W2965184183","doi":"https://doi.org/10.26599/bdma.2018.9020037","mag":"2965184183"},"language":"en","primary_location":{"id":"doi:10.26599/bdma.2018.9020037","is_oa":true,"landing_page_url":"https://doi.org/10.26599/bdma.2018.9020037","pdf_url":"https://ieeexplore.ieee.org/ielx7/8254253/8787225/08787229.pdf","source":{"id":"https://openalex.org/S4210209060","display_name":"Big Data Mining and Analytics","issn_l":"2096-0654","issn":["2096-0654"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311901","host_organization_name":"Tsinghua University Press","host_organization_lineage":["https://openalex.org/P4310311901"],"host_organization_lineage_names":["Tsinghua University Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data Mining and Analytics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ieeexplore.ieee.org/ielx7/8254253/8787225/08787229.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073624587","display_name":"Sunil Kumar","orcid":"https://orcid.org/0000-0002-9778-6550"},"institutions":[{"id":"https://openalex.org/I223471776","display_name":"Guru Angad Dev Veterinary and Animal Sciences University","ror":"https://ror.org/00bbeqy02","country_code":"IN","type":"education","lineage":["https://openalex.org/I223471776"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Sunil Kumar","raw_affiliation_strings":["Directorate of Livestock Farms, Guru Angad Dev Veterinary and Animal Sciences University, Ludhiana 141001, India"],"affiliations":[{"raw_affiliation_string":"Directorate of Livestock Farms, Guru Angad Dev Veterinary and Animal Sciences University, Ludhiana 141001, India","institution_ids":["https://openalex.org/I223471776"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086900671","display_name":"Maninder Singh","orcid":"https://orcid.org/0000-0001-8489-8759"},"institutions":[{"id":"https://openalex.org/I79161377","display_name":"Punjabi University","ror":"https://ror.org/00xdn8y92","country_code":"IN","type":"education","lineage":["https://openalex.org/I79161377"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Maninder Singh","raw_affiliation_strings":["Department of Computer Science, Punjabi University, Punjab 147002, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Punjabi University, Punjab 147002, India","institution_ids":["https://openalex.org/I79161377"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5073624587"],"corresponding_institution_ids":["https://openalex.org/I223471776"],"apc_list":null,"apc_paid":null,"fwci":4.0605,"has_fulltext":true,"cited_by_count":46,"citation_normalized_percentile":{"value":0.951541,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"2","issue":"4","first_page":"240","last_page":"247"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.8733999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.8733999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13731","display_name":"Advanced Computing and Algorithms","score":0.7713000178337097,"subfield":{"id":"https://openalex.org/subfields/3322","display_name":"Urban Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.7584999799728394,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8611705899238586},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7925092577934265},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.7434622049331665},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.7056968808174133},{"id":"https://openalex.org/keywords/canopy-clustering-algorithm","display_name":"Canopy clustering algorithm","score":0.6391164064407349},{"id":"https://openalex.org/keywords/data-stream-clustering","display_name":"Data stream clustering","score":0.6255385875701904},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.5559492111206055},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5512762665748596},{"id":"https://openalex.org/keywords/fuzzy-clustering","display_name":"Fuzzy clustering","score":0.4732794463634491},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.47174322605133057},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.42009374499320984},{"id":"https://openalex.org/keywords/clustering-high-dimensional-data","display_name":"Clustering high-dimensional data","score":0.4119982123374939},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2807224988937378},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12198615074157715}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8611705899238586},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7925092577934265},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.7434622049331665},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.7056968808174133},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.6391164064407349},{"id":"https://openalex.org/C193143536","wikidata":"https://www.wikidata.org/wiki/Q5227360","display_name":"Data stream clustering","level":5,"score":0.6255385875701904},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.5559492111206055},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5512762665748596},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.4732794463634491},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.47174322605133057},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.42009374499320984},{"id":"https://openalex.org/C184509293","wikidata":"https://www.wikidata.org/wiki/Q5136711","display_name":"Clustering high-dimensional data","level":3,"score":0.4119982123374939},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2807224988937378},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12198615074157715}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.26599/bdma.2018.9020037","is_oa":true,"landing_page_url":"https://doi.org/10.26599/bdma.2018.9020037","pdf_url":"https://ieeexplore.ieee.org/ielx7/8254253/8787225/08787229.pdf","source":{"id":"https://openalex.org/S4210209060","display_name":"Big Data Mining and Analytics","issn_l":"2096-0654","issn":["2096-0654"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311901","host_organization_name":"Tsinghua University Press","host_organization_lineage":["https://openalex.org/P4310311901"],"host_organization_lineage_names":["Tsinghua University Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data Mining and Analytics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:6a34f9e29dcc4346940cc11b16c94363","is_oa":true,"landing_page_url":"https://doaj.org/article/6a34f9e29dcc4346940cc11b16c94363","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Big Data Mining and Analytics, Vol 2, Iss 4, Pp 240-247 (2019)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.26599/bdma.2018.9020037","is_oa":true,"landing_page_url":"https://doi.org/10.26599/bdma.2018.9020037","pdf_url":"https://ieeexplore.ieee.org/ielx7/8254253/8787225/08787229.pdf","source":{"id":"https://openalex.org/S4210209060","display_name":"Big Data Mining and Analytics","issn_l":"2096-0654","issn":["2096-0654"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311901","host_organization_name":"Tsinghua University Press","host_organization_lineage":["https://openalex.org/P4310311901"],"host_organization_lineage_names":["Tsinghua University Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data Mining and Analytics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Life in Land","score":0.5,"id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2965184183.pdf","grobid_xml":"https://content.openalex.org/works/W2965184183.grobid-xml"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W40976687","https://openalex.org/W176412762","https://openalex.org/W316408160","https://openalex.org/W1503321541","https://openalex.org/W1860789530","https://openalex.org/W1967368946","https://openalex.org/W1975827585","https://openalex.org/W1988711335","https://openalex.org/W2009728897","https://openalex.org/W2050802111","https://openalex.org/W2055533652","https://openalex.org/W2057923756","https://openalex.org/W2095178814","https://openalex.org/W2101228436","https://openalex.org/W2109574129","https://openalex.org/W2120751691","https://openalex.org/W2121784101","https://openalex.org/W2126626732","https://openalex.org/W2161160262","https://openalex.org/W2247765268","https://openalex.org/W2261525379","https://openalex.org/W2553163363"],"related_works":["https://openalex.org/W4301002638","https://openalex.org/W2371010743","https://openalex.org/W2163563073","https://openalex.org/W3088133960","https://openalex.org/W1987613674","https://openalex.org/W3186815950","https://openalex.org/W4253632195","https://openalex.org/W2393707058","https://openalex.org/W3168768270","https://openalex.org/W2590117803"],"abstract_inverted_index":{"Big":[0],"data":[1,4,11,29,32,42,47,51],"analytics":[2],"and":[3,12,21,35,54,71,95,141,161,166],"mining":[5,43],"are":[6,73],"techniques":[7],"used":[8],"to":[9,13,19,58,91,115],"analyze":[10],"extract":[14,59],"hidden":[15],"information.":[16],"Traditional":[17],"approaches":[18],"analysis":[20],"extraction":[22],"do":[23],"not":[24,74],"work":[25],"well":[26],"for":[27],"big":[28],"because":[30],"this":[31,101],"is":[33,84,88,150,158],"complex":[34],"of":[36,79,119,135,143],"very":[37],"high":[38],"volume.":[39],"A":[40],"major":[41],"technique":[44],"known":[45],"as":[46,69,76],"clustering":[48,66,98,108,112,121,156],"groups":[49],"the":[50,77,80,117,125,133,146,153],"into":[52],"clusters":[53,81],"makes":[55],"it":[56,149],"easy":[57],"information":[60],"from":[61],"these":[62],"clusters.":[63],"However,":[64],"existing":[65,120,130],"algorithms,":[67],"such":[68],"k-means":[70],"hierarchical,":[72],"efficient":[75,94],"quality":[78],"they":[82],"produce":[83],"compromised.":[85],"Therefore,":[86],"there":[87],"a":[89,106],"need":[90],"design":[92],"an":[93],"highly":[96],"scalable":[97],"algorithm.":[99],"In":[100],"paper,":[102],"we":[103],"put":[104],"forward":[105],"new":[107,126],"algorithm":[109,128,157],"called":[110],"hybrid":[111,127,155],"in":[113],"order":[114],"overcome":[116],"disadvantages":[118],"algorithms.":[122],"We":[123],"compare":[124],"with":[129],"algorithms":[131],"on":[132],"bases":[134],"precision,":[136,164],"recall,":[137,165],"F-measure,":[138],"execution":[139],"time,":[140],"accuracy":[142],"results.":[144],"From":[145],"experimental":[147],"results,":[148],"clear":[151],"that":[152],"proposed":[154],"more":[159],"accurate,":[160],"has":[162],"better":[163],"F-measure":[167],"values.":[168]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":11},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
