{"id":"https://openalex.org/W2120263102","doi":"https://doi.org/10.1145/1142351.1142374","title":"Achieving anonymity via clustering","display_name":"Achieving anonymity via clustering","publication_year":2006,"publication_date":"2006-06-26","ids":{"openalex":"https://openalex.org/W2120263102","doi":"https://doi.org/10.1145/1142351.1142374","mag":"2120263102"},"language":"en","primary_location":{"id":"doi:10.1145/1142351.1142374","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1142351.1142374","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the twenty-fifth ACM SIGMOD-SIGACT-SIGART symposium on Principles of database systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070757517","display_name":"Gagan Aggarwal","orcid":"https://orcid.org/0009-0003-3296-4891"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Gagan Aggarwal","raw_affiliation_strings":["Google Inc., Mountain View, CA","Google Inc., Mountain View, CA#TAB#"],"affiliations":[{"raw_affiliation_string":"Google Inc., Mountain View, CA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google Inc., Mountain View, CA#TAB#","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109192583","display_name":"Tom\u00e1s Feder","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tom\u00e1s Feder","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002843568","display_name":"Krishnaram Kenthapadi","orcid":"https://orcid.org/0000-0003-1237-087X"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Krishnaram Kenthapadi","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042716179","display_name":"Samir Khuller","orcid":"https://orcid.org/0000-0002-5408-8023"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samir Khuller","raw_affiliation_strings":["University of Maryland, College Park, MD"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085651536","display_name":"Rina Panigrahy\u200e","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rina Panigrahy","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045549079","display_name":"Dilys Thomas","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dilys Thomas","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109121225","display_name":"An Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"An Zhu","raw_affiliation_strings":["Google Inc., Mountain View, CA","Google Inc., Mountain View, CA#TAB#"],"affiliations":[{"raw_affiliation_string":"Google Inc., Mountain View, CA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google Inc., Mountain View, CA#TAB#","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5070757517"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":43.3745,"has_fulltext":false,"cited_by_count":277,"citation_normalized_percentile":{"value":0.9986901,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"153","last_page":"162"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11598","display_name":"Internet Traffic Analysis and Secure E-voting","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.9818999767303467,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.785136342048645},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6851260662078857},{"id":"https://openalex.org/keywords/data-anonymization","display_name":"Data anonymization","score":0.632752537727356},{"id":"https://openalex.org/keywords/anonymity","display_name":"Anonymity","score":0.6079891324043274},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.5854201316833496},{"id":"https://openalex.org/keywords/data-publishing","display_name":"Data publishing","score":0.5356402397155762},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.48096218705177307},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.45989635586738586},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.45986223220825195},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.45404139161109924},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42178696393966675},{"id":"https://openalex.org/keywords/k-anonymity","display_name":"k-anonymity","score":0.4187832772731781},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.38141801953315735},{"id":"https://openalex.org/keywords/information-privacy","display_name":"Information privacy","score":0.3747705817222595},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.2739587426185608},{"id":"https://openalex.org/keywords/publishing","display_name":"Publishing","score":0.16267627477645874},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.11405852437019348},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.11322343349456787}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.785136342048645},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6851260662078857},{"id":"https://openalex.org/C2776945810","wikidata":"https://www.wikidata.org/wiki/Q17006654","display_name":"Data anonymization","level":3,"score":0.632752537727356},{"id":"https://openalex.org/C178005623","wikidata":"https://www.wikidata.org/wiki/Q308859","display_name":"Anonymity","level":2,"score":0.6079891324043274},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.5854201316833496},{"id":"https://openalex.org/C2781396290","wikidata":"https://www.wikidata.org/wiki/Q17051824","display_name":"Data publishing","level":3,"score":0.5356402397155762},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.48096218705177307},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.45989635586738586},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.45986223220825195},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.45404139161109924},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42178696393966675},{"id":"https://openalex.org/C2777706471","wikidata":"https://www.wikidata.org/wiki/Q17061432","display_name":"k-anonymity","level":3,"score":0.4187832772731781},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.38141801953315735},{"id":"https://openalex.org/C123201435","wikidata":"https://www.wikidata.org/wiki/Q456632","display_name":"Information privacy","level":2,"score":0.3747705817222595},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2739587426185608},{"id":"https://openalex.org/C151719136","wikidata":"https://www.wikidata.org/wiki/Q3972943","display_name":"Publishing","level":2,"score":0.16267627477645874},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.11405852437019348},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.11322343349456787},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1142351.1142374","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1142351.1142374","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the twenty-fifth ACM SIGMOD-SIGACT-SIGART symposium on Principles of database systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.4000000059604645}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W76214014","https://openalex.org/W1891203375","https://openalex.org/W1971680805","https://openalex.org/W2003719999","https://openalex.org/W2011039300","https://openalex.org/W2052806235","https://openalex.org/W2055996587","https://openalex.org/W2073583237","https://openalex.org/W2104701012","https://openalex.org/W2124295613","https://openalex.org/W2134479759","https://openalex.org/W2159024459","https://openalex.org/W2161030490","https://openalex.org/W2161229593","https://openalex.org/W2169134473","https://openalex.org/W2476096155","https://openalex.org/W3122840867","https://openalex.org/W4285719527","https://openalex.org/W6603104669"],"related_works":["https://openalex.org/W2031844830","https://openalex.org/W2741549564","https://openalex.org/W2393528873","https://openalex.org/W2898931495","https://openalex.org/W2735807361","https://openalex.org/W2381826434","https://openalex.org/W3206397491","https://openalex.org/W3214359279","https://openalex.org/W2967268087","https://openalex.org/W1666070292"],"abstract_inverted_index":{"Publishing":[0],"data":[1,118,123,139,157,276],"for":[2,76,90,109,116,171,210,278,291],"analysis":[3,279],"from":[4,256],"a":[5,15,45,113,153,167,183,201,228,264],"table":[6],"containing":[7],"personal":[8],"records,":[9,119,140,270],"while":[10],"maintaining":[11],"individual":[12],"privacy,":[13],"is":[14,27,161,204,217,285],"problem":[16,213],"of":[17,24,48,63,122,137,156,208,219,237,249,267,296],"increasing":[18],"importance":[19],"today.":[20],"The":[21],"traditional":[22],"approach":[23],"de-identifying":[25],"records":[26,103,124],"to":[28,196,244,251],"remove":[29],"identifying":[30],"fields":[31],"such":[32,60,200],"as":[33,61,307],"social":[34],"security":[35],"number,":[36],"name":[37],"etc.":[38],"However,":[39],"recent":[40],"research":[41],"has":[42,280],"shown":[43],"that":[44,81,145,227,274],"large":[46],"fraction":[47,248,266],"the":[49,73,94,106,138,143,205,211,215,220,235,257,268,275],"US":[50],"population":[51],"can":[52,232,272],"be":[53,301],"identified":[54],"using":[55],"non-key":[56,79],"attributes":[57,80],"(called":[58],"quasi-identifiers)":[59],"date":[62],"birth,":[64],"gender,":[65],"and":[66,128,283,299],"zip":[67],"code":[68],"[15].":[69],"Sweeney":[70],"[16]":[71],"proposed":[72],"k-anonymity":[74],"model":[75],"privacy":[77,136],"where":[78,120,214],"leak":[82],"information":[83,186],"are":[84,98,125,132,295],"suppressed":[85],"or":[86],"generalized":[87],"so":[88],"that,":[89],"every":[91],"record":[92],"in":[93,303],"modified":[95],"table,":[96],"there":[97],"at":[99],"least":[100],"k\u22121":[101],"other":[102,304],"having":[104],"exactly":[105],"same":[107],"values":[108],"quasi-identifiers.":[110],"We":[111,190,224],"propose":[112],"new":[114,292],"method":[115],"anonymizing":[117],"quasi-identifiers":[121],"first":[126,206],"clustered":[127],"then":[129],"cluster":[130,147,172],"centers":[131,173],"published.":[133],"To":[134],"ensure":[135,273],"we":[141,165,240,271],"impose":[142],"constraint":[144],"each":[146],"must":[148],"contain":[149],"no":[150],"fewer":[151],"than":[152,174],"pre-specified":[154],"number":[155],"records.":[158],"This":[159,203],"technique":[160],"more":[162,185,286],"general":[163],"since":[164],"have":[166],"much":[168],"larger":[169],"choice":[170],"k-Anonymity.":[175],"In":[176],"many":[177],"cases,":[178],"it":[179],"lets":[180],"us":[181],"release":[182],"lot":[184],"without":[187],"compromising":[188],"privacy.":[189],"also":[191],"provide":[192],"constant-factor":[193],"approximation":[194,289],"algorithms":[195,209,243,290],"come":[197],"up":[198],"with":[199],"clustering.":[202],"set":[207],"anonymization":[212],"performance":[216],"independent":[218,297],"anonymity":[221],"parameter":[222],"k.":[223],"further":[225],"observe":[226],"few":[229],"outlier":[230],"points":[231,250],"significantly":[233],"increase":[234],"cost":[236],"anonymization.":[238],"Hence,":[239],"extend":[241],"our":[242],"allow":[245],"an":[246],"\u03b5":[247],"remain":[252],"unclustered,":[253],"i.e.,":[254],"deleted":[255],"anonymized":[258],"publication.":[259],"Thus,":[260],"by":[261],"not":[262],"releasing":[263],"small":[265],"database":[269],"published":[277],"less":[281],"distortion":[282],"hence":[284],"useful.":[287],"Our":[288],"clustering":[293,305],"objectives":[294],"interest":[298],"could":[300],"applicable":[302],"scenarios":[306],"well.":[308]},"counts_by_year":[{"year":2023,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":11},{"year":2016,"cited_by_count":15},{"year":2015,"cited_by_count":12},{"year":2014,"cited_by_count":11},{"year":2013,"cited_by_count":21},{"year":2012,"cited_by_count":25}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
