{"id":"https://openalex.org/W2055935910","doi":"https://doi.org/10.1145/1989323.1989399","title":"Local graph sparsification for scalable clustering","display_name":"Local graph sparsification for scalable clustering","publication_year":2011,"publication_date":"2011-06-12","ids":{"openalex":"https://openalex.org/W2055935910","doi":"https://doi.org/10.1145/1989323.1989399","mag":"2055935910"},"language":"en","primary_location":{"id":"doi:10.1145/1989323.1989399","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1989323.1989399","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2011 ACM SIGMOD International Conference on Management of data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070529813","display_name":"Venu Satuluri","orcid":null},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Venu Satuluri","raw_affiliation_strings":["The Ohio State University, Columbus, OH, USA","The Ohio State University, Columbus, OH, USA.;"],"affiliations":[{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]},{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA.;","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100755351","display_name":"Srinivasan Parthasarathy","orcid":"https://orcid.org/0000-0002-6062-6449"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Srinivasan Parthasarathy","raw_affiliation_strings":["The Ohio State University, Columbus, OH, USA","The Ohio State University, Columbus, OH, USA.;"],"affiliations":[{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]},{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA.;","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023312718","display_name":"Yiye Ruan","orcid":null},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiye Ruan","raw_affiliation_strings":["The Ohio State University, Columbus, OH, USA","The Ohio State University, Columbus, OH, USA.;"],"affiliations":[{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]},{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA.;","institution_ids":["https://openalex.org/I52357470"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5070529813"],"corresponding_institution_ids":["https://openalex.org/I52357470"],"apc_list":null,"apc_paid":null,"fwci":7.3979,"has_fulltext":false,"cited_by_count":167,"citation_normalized_percentile":{"value":0.97753057,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"721","last_page":"732"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7991101741790771},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7146013975143433},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6575846076011658},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5493615865707397},{"id":"https://openalex.org/keywords/clustering-coefficient","display_name":"Clustering coefficient","score":0.5057995319366455},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.4974499046802521},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4750245213508606},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4562474489212036},{"id":"https://openalex.org/keywords/single-linkage-clustering","display_name":"Single-linkage clustering","score":0.42502155900001526},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.3519596755504608},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33282628655433655},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.251200795173645}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7991101741790771},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7146013975143433},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6575846076011658},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5493615865707397},{"id":"https://openalex.org/C22047676","wikidata":"https://www.wikidata.org/wiki/Q898680","display_name":"Clustering coefficient","level":3,"score":0.5057995319366455},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.4974499046802521},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4750245213508606},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4562474489212036},{"id":"https://openalex.org/C22648726","wikidata":"https://www.wikidata.org/wiki/Q7523744","display_name":"Single-linkage clustering","level":5,"score":0.42502155900001526},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.3519596755504608},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33282628655433655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.251200795173645},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1989323.1989399","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1989323.1989399","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2011 ACM SIGMOD International Conference on Management of data","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4699999988079071,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W139517508","https://openalex.org/W1549390321","https://openalex.org/W1581656968","https://openalex.org/W1588155622","https://openalex.org/W1601142477","https://openalex.org/W1604983895","https://openalex.org/W1978024959","https://openalex.org/W1991800036","https://openalex.org/W2000042664","https://openalex.org/W2023655578","https://openalex.org/W2045107949","https://openalex.org/W2051540665","https://openalex.org/W2068888615","https://openalex.org/W2070232376","https://openalex.org/W2086486316","https://openalex.org/W2094688862","https://openalex.org/W2095293504","https://openalex.org/W2101196063","https://openalex.org/W2102322109","https://openalex.org/W2107067224","https://openalex.org/W2107904695","https://openalex.org/W2112490961","https://openalex.org/W2115022330","https://openalex.org/W2121564430","https://openalex.org/W2121947440","https://openalex.org/W2125664420","https://openalex.org/W2127048411","https://openalex.org/W2131717044","https://openalex.org/W2133102806","https://openalex.org/W2135957668","https://openalex.org/W2137253512","https://openalex.org/W2146008005","https://openalex.org/W2148043260","https://openalex.org/W2149857793","https://openalex.org/W2164858177","https://openalex.org/W2171935404","https://openalex.org/W3102641634","https://openalex.org/W3103362336","https://openalex.org/W4233437719","https://openalex.org/W6676366283","https://openalex.org/W6680064377"],"related_works":["https://openalex.org/W2188840951","https://openalex.org/W4241767317","https://openalex.org/W2101637161","https://openalex.org/W2171610853","https://openalex.org/W2160785859","https://openalex.org/W1999117613","https://openalex.org/W2559422900","https://openalex.org/W3092684173","https://openalex.org/W2103650652","https://openalex.org/W1887359504"],"abstract_inverted_index":{"In":[0,138],"this":[1],"paper":[2],"we":[3,65,83],"look":[4],"at":[5,141],"how":[6,12],"to":[7,13,24,39,47,56,77,89],"sparsify":[8],"a":[9,60],"graph":[10,27,107],"i.e.":[11],"reduce":[14],"the":[15,19,42,51,70,74,78,85,93,123,132,135,145],"edgeset":[16],"while":[17],"keeping":[18],"nodes":[20,75],"intact,":[21],"so":[22],"as":[23],"enable":[25],"faster":[26],"clustering":[28,108,147,154],"without":[29],"sacrificing":[30],"quality.":[31],"The":[32],"main":[33],"idea":[34],"behind":[35],"our":[36,115,149],"approach":[37,117],"is":[38],"preferentially":[40],"retain":[41],"edges":[43,58,88],"that":[44,64,114],"are":[45],"likely":[46],"be":[48,90],"part":[49],"of":[50,73,134,144],"same":[52],"cluster.":[53],"We":[54],"propose":[55],"rank":[57],"using":[59,104],"simple":[61],"similarity-based":[62],"heuristic":[63],"efficiently":[66],"compute":[67],"by":[68],"comparing":[69],"minhash":[71],"signatures":[72],"incident":[76],"edge.":[79],"For":[80],"each":[81],"node,":[82],"select":[84],"top":[86],"few":[87],"retained":[91],"in":[92,122,131],"sparsified":[94],"graph.":[95],"Extensive":[96],"empirical":[97],"results":[98],"on":[99],"several":[100],"real":[101],"networks":[102],"and":[103,109],"four":[105,146],"state-of-the-art":[106],"community":[110],"discovery":[111],"algorithms":[112],"reveal":[113],"proposed":[116],"realizes":[118],"excellent":[119],"speedups":[120],"(often":[121],"range":[124],"10-50),":[125],"with":[126],"little":[127],"or":[128],"no":[129],"deterioration":[130],"quality":[133],"resulting":[136],"clusters.":[137],"fact,":[139],"for":[140],"least":[142],"two":[143],"algorithms,":[148],"sparsification":[150],"consistently":[151],"enables":[152],"higher":[153],"accuracies.":[155]},"counts_by_year":[{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":7},{"year":2017,"cited_by_count":13},{"year":2016,"cited_by_count":19},{"year":2015,"cited_by_count":20},{"year":2014,"cited_by_count":12},{"year":2013,"cited_by_count":9},{"year":2012,"cited_by_count":8}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
