{"id":"https://openalex.org/W2520037496","doi":"https://doi.org/10.1109/tkde.2016.2609423","title":"Efficient Distributed Density Peaks for Clustering Large Data Sets in MapReduce","display_name":"Efficient Distributed Density Peaks for Clustering Large Data Sets in MapReduce","publication_year":2016,"publication_date":"2016-09-14","ids":{"openalex":"https://openalex.org/W2520037496","doi":"https://doi.org/10.1109/tkde.2016.2609423","mag":"2520037496"},"language":"en","primary_location":{"id":"doi:10.1109/tkde.2016.2609423","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2016.2609423","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100367496","display_name":"Yanfeng Zhang","orcid":"https://orcid.org/0000-0002-9871-0304"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanfeng Zhang","raw_affiliation_strings":["School of Computer Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101499113","display_name":"Shimin Chen","orcid":"https://orcid.org/0009-0000-1043-6236"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shimin Chen","raw_affiliation_strings":["State Key Laboratory of Computer Architecture, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Computer Architecture, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072406974","display_name":"Ge Yu","orcid":"https://orcid.org/0000-0002-3171-8889"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ge Yu","raw_affiliation_strings":["School of Computer Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100367496"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":3.7166,"has_fulltext":false,"cited_by_count":63,"citation_normalized_percentile":{"value":0.95673156,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"28","issue":"12","first_page":"3218","last_page":"3230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.822216272354126},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7653490304946899},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7377896308898926},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7284796237945557},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6355359554290771},{"id":"https://openalex.org/keywords/locality-sensitive-hashing","display_name":"Locality-sensitive hashing","score":0.5601903796195984},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5494527220726013},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.5334266424179077},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.49612435698509216},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4508315622806549},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.43686509132385254},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34485486149787903},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.2953428626060486},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.10908165574073792}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.822216272354126},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7653490304946899},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7377896308898926},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7284796237945557},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6355359554290771},{"id":"https://openalex.org/C74270461","wikidata":"https://www.wikidata.org/wiki/Q1625299","display_name":"Locality-sensitive hashing","level":4,"score":0.5601903796195984},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5494527220726013},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.5334266424179077},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49612435698509216},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4508315622806549},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.43686509132385254},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34485486149787903},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.2953428626060486},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.10908165574073792},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tkde.2016.2609423","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2016.2609423","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G139175041","display_name":null,"funder_award_id":"N141605001","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G2272985169","display_name":null,"funder_award_id":"61300023","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3875971815","display_name":null,"funder_award_id":"61572468","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4006564843","display_name":null,"funder_award_id":"61433008","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5574275911","display_name":null,"funder_award_id":"61672141","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7890275306","display_name":null,"funder_award_id":"61528203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8380396287","display_name":null,"funder_award_id":"61521092","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W105622892","https://openalex.org/W177602031","https://openalex.org/W185144071","https://openalex.org/W596485744","https://openalex.org/W795388544","https://openalex.org/W1502916507","https://openalex.org/W1535532259","https://openalex.org/W1564609383","https://openalex.org/W1673310716","https://openalex.org/W1754357762","https://openalex.org/W1967275758","https://openalex.org/W1976861199","https://openalex.org/W1980771692","https://openalex.org/W1992677509","https://openalex.org/W2040574519","https://openalex.org/W2049003051","https://openalex.org/W2049633694","https://openalex.org/W2071218392","https://openalex.org/W2111887504","https://openalex.org/W2119885577","https://openalex.org/W2126154518","https://openalex.org/W2126399065","https://openalex.org/W2147347448","https://openalex.org/W2147717514","https://openalex.org/W2150593711","https://openalex.org/W2153622543","https://openalex.org/W2154879298","https://openalex.org/W2155502235","https://openalex.org/W2160064536","https://openalex.org/W2162006472","https://openalex.org/W2162866953","https://openalex.org/W2165835468","https://openalex.org/W2170037597","https://openalex.org/W2337492206","https://openalex.org/W2799047321","https://openalex.org/W2999729612","https://openalex.org/W3007826101","https://openalex.org/W3098238967","https://openalex.org/W4205637966","https://openalex.org/W4300988640","https://openalex.org/W6604221439","https://openalex.org/W6607280872","https://openalex.org/W6617955183","https://openalex.org/W6629956336","https://openalex.org/W6633903505","https://openalex.org/W6638047745","https://openalex.org/W6685012337","https://openalex.org/W6891775057"],"related_works":["https://openalex.org/W2058965144","https://openalex.org/W2164382479","https://openalex.org/W98480971","https://openalex.org/W2150291671","https://openalex.org/W2027972911","https://openalex.org/W2146343568","https://openalex.org/W2013643406","https://openalex.org/W2144265691","https://openalex.org/W2033383639","https://openalex.org/W3108918257"],"abstract_inverted_index":{"Density":[0],"Peaks":[1],"(DP)":[2],"is":[3,46],"a":[4,23,66,165,174,217],"recently":[5],"proposed":[6],"clustering":[7,15],"algorithm":[8,83],"that":[9,65,84,124,145,171],"has":[10,18,71,204],"distinctive":[11],"advantages":[12],"over":[13,179,186],"existing":[14],"algorithms.":[16],"It":[17],"already":[19],"been":[20],"used":[21],"in":[22,108,134],"wide":[24],"range":[25],"of":[26,37,117,126,141,159,176],"applications.":[27],"However,":[28],"DP":[29,118],"requires":[30],"computing":[31],"the":[32,101,115,122,127,146,150,157,180,187,198],"distance":[33],"between":[34],"every":[35],"pair":[36],"input":[38],"points,":[39],"therefore":[40],"incurring":[41],"quadratic":[42],"computation":[43,75],"overhead,":[44],"which":[45],"prohibitive":[47],"for":[48,60,89,111],"large":[49],"data":[50],"sets.":[51],"In":[52],"this":[53],"paper,":[54],"we":[55,78],"study":[56],"efficient":[57],"distributed":[58],"algorithms":[59],"DP.":[61,112],"We":[62,104,113,137],"first":[63],"show":[64,144,170],"naive":[67,181],"MapReduce":[68],"solution":[69],"(Basic-DDP)":[70],"high":[72],"communication":[73],"and":[74,95,143,149,168,183],"overhead.":[76],"Then,":[77],"propose":[79],"LSH-DDP,":[80,142],"an":[81],"approximate":[82,100],"exploits":[85],"Locality":[86],"Sensitive":[87],"Hashing":[88],"partitioning":[90],"data,":[91],"performs":[92],"local":[93,97,135,166],"computation,":[94],"aggregates":[96],"results":[98,162],"to":[99,119,197],"final":[102],"results.":[103,195],"address":[105],"several":[106],"challenges":[107],"employing":[109],"LSH":[110],"leverage":[114],"characteristics":[116],"deal":[120],"with":[121,216],"fact":[123],"some":[125],"result":[128],"values":[129],"cannot":[130],"be":[131,153],"directly":[132],"approximated":[133],"partitions.":[136],"present":[138],"formal":[139],"analysis":[140],"approximation":[147],"quality":[148],"runtime":[151],"can":[152],"controlled":[154],"by":[155],"tuning":[156],"parameters":[158],"LSH-DDP.":[160],"Experimental":[161],"on":[163],"both":[164],"cluster":[167,194],"EC2":[169],"LSH-DDP":[172,202,210],"achieves":[173],"factor":[175],"1.7-70x":[177],"speedup":[178,185],"Basic-DDP":[182],"2x":[184],"state-of-the-art":[188],"EDDPC":[189],"approach,":[190],"while":[191],"returning":[192],"comparable":[193,205],"Compared":[196],"popular":[199],"K-means":[200],"clustering,":[201],"also":[203],"or":[206],"better":[207],"performance.":[208],"Furthermore,":[209],"could":[211],"achieve":[212],"even":[213],"higher":[214],"efficiency":[215],"lower":[218],"accuracy":[219],"requirement.":[220]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":10},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":8}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
