{"id":"https://openalex.org/W3012849342","doi":"https://doi.org/10.1145/3366423.3380045","title":"Clustering with a faulty oracle","display_name":"Clustering with a faulty oracle","publication_year":2020,"publication_date":"2020-04-20","ids":{"openalex":"https://openalex.org/W3012849342","doi":"https://doi.org/10.1145/3366423.3380045","mag":"3012849342"},"language":"en","primary_location":{"id":"doi:10.1145/3366423.3380045","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380045","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3366423.3380045","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013551063","display_name":"Kasper Green Larsen","orcid":"https://orcid.org/0000-0001-8841-5929"},"institutions":[{"id":"https://openalex.org/I204337017","display_name":"Aarhus University","ror":"https://ror.org/01aj84f44","country_code":"DK","type":"education","lineage":["https://openalex.org/I204337017"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Kasper Green Larsen","raw_affiliation_strings":["Aarhus University"],"affiliations":[{"raw_affiliation_string":"Aarhus University","institution_ids":["https://openalex.org/I204337017"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062318856","display_name":"Michael Mitzenmacher","orcid":"https://orcid.org/0000-0001-5430-5457"},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Mitzenmacher","raw_affiliation_strings":["Harvard University"],"affiliations":[{"raw_affiliation_string":"Harvard University","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069421706","display_name":"Charalampos E. Tsourakakis","orcid":"https://orcid.org/0000-0001-5591-3585"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Charalampos Tsourakakis","raw_affiliation_strings":["Boston University"],"affiliations":[{"raw_affiliation_string":"Boston University","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5013551063"],"corresponding_institution_ids":["https://openalex.org/I204337017"],"apc_list":null,"apc_paid":null,"fwci":0.4115,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.68303229,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"2831","last_page":"2834"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7410178780555725},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7167534828186035},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.5693897008895874},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.35394901037216187},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2906864285469055},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1813124716281891}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7410178780555725},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7167534828186035},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.5693897008895874},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35394901037216187},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2906864285469055},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1813124716281891}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/3366423.3380045","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380045","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},{"id":"pmh:oai:open.bu.edu:2144/41398","is_oa":false,"landing_page_url":"https://hdl.handle.net/2144/41398","pdf_url":null,"source":{"id":"https://openalex.org/S4306402384","display_name":"OpenBU (Boston University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I111088046","host_organization_name":"Boston University","host_organization_lineage":["https://openalex.org/I111088046"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference materials"},{"id":"pmh:oai:pure.atira.dk:openaire/7fe169e9-d0fe-4ccf-95a0-23abcff34268","is_oa":true,"landing_page_url":"https://pure.au.dk/portal/en/publications/7fe169e9-d0fe-4ccf-95a0-23abcff34268","pdf_url":null,"source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Green Larsen, K, Mitzenmacher, M & Tsourakakis, C 2020, Clustering with a faulty oracle. in Y Huang, I King, T-Y Liu & M van Steen (eds), WWW '20 : Proceedings of The Web Conference 2020. Association for Computing Machinery, New York, pp. 2831-2834, WWW '20, Taipei , Taiwan, 20/04/2020. https://doi.org/10.1145/3366423.3380045","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.atira.dk:publications/7fe169e9-d0fe-4ccf-95a0-23abcff34268","is_oa":true,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=85086596158&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306400063","display_name":"Scopus (Elsevier)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Green Larsen, K, Mitzenmacher, M & Tsourakakis, C 2020, Clustering with a faulty oracle. in Y Huang, I King, T-Y Liu & M van Steen (eds), WWW '20 : Proceedings of The Web Conference 2020. Association for Computing Machinery, New York, pp. 2831-2834, WWW '20, Taipei , Taiwan, 20/04/2020. https://doi.org/10.1145/3366423.3380045","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1145/3366423.3380045","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380045","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1496255159","https://openalex.org/W1595409123","https://openalex.org/W1605711022","https://openalex.org/W1992402718","https://openalex.org/W1993111701","https://openalex.org/W2011430131","https://openalex.org/W2060990051","https://openalex.org/W2067883080","https://openalex.org/W2073415627","https://openalex.org/W2073459066","https://openalex.org/W2097186564","https://openalex.org/W2098044836","https://openalex.org/W2106944855","https://openalex.org/W2107223449","https://openalex.org/W2108399535","https://openalex.org/W2109682749","https://openalex.org/W2111040408","https://openalex.org/W2113239207","https://openalex.org/W2130519052","https://openalex.org/W2142517301","https://openalex.org/W2145096794","https://openalex.org/W2165432920","https://openalex.org/W2165874743","https://openalex.org/W2488678869","https://openalex.org/W2567866584","https://openalex.org/W2605800612","https://openalex.org/W2614891641","https://openalex.org/W2704180839","https://openalex.org/W2807267202","https://openalex.org/W2914959486","https://openalex.org/W2963264680","https://openalex.org/W2963829083","https://openalex.org/W2973282627","https://openalex.org/W3097350880","https://openalex.org/W3098152555","https://openalex.org/W6668990524"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2073713056","https://openalex.org/W3110702597","https://openalex.org/W2078761926","https://openalex.org/W2110441383","https://openalex.org/W2125620709","https://openalex.org/W1498872724","https://openalex.org/W2390279801"],"abstract_inverted_index":{"Clustering,":[0],"i.e.,":[1],"finding":[2],"groups":[3],"in":[4,44],"the":[5,19,54,95,101,104,123],"data,":[6],"is":[7,106],"a":[8,24],"problem":[9,20],"that":[10],"permeates":[11],"multiple":[12],"fields":[13],"of":[14,21,42,89],"science":[15],"and":[16,39,65,68,70],"engineering.":[17],"Recently,":[18],"clustering":[22],"with":[23,108],"noisy":[25],"oracle":[26],"has":[27],"drawn":[28],"attention":[29],"due":[30],"to":[31,78,85,94,103],"various":[32],"applications":[33],"including":[34],"crowdsourced":[35],"entity":[36],"resolution":[37],"[33],":[38],"predicting":[40],"signs":[41],"interactions":[43],"large-scale":[45],"online":[46],"social":[47],"networks":[48],"[20,":[49],"21].":[50],"Here,":[51],"we":[52],"consider":[53],"following":[55],"fundamental":[56],"model":[57],"for":[58],"two":[59,79],"clusters":[60],"as":[61],"proposed":[62],"by":[63],"Mitzenmacher":[64],"Tsourakakis":[66],"[28],":[67],"Mazumdar":[69],"Saha":[71],"[25];":[72],"there":[73],"exist":[74],"n":[75],"items,":[76],"belonging":[77],"unknown":[80],"groups.":[81],"We":[82],"are":[83],"allowed":[84],"query":[86,105],"any":[87],"pair":[88],"nodes":[90],"whether":[91],"they":[92],"belong":[93],"same":[96],"cluster":[97],"or":[98],"not,":[99],"but":[100],"answer":[102],"corrupted":[107],"some":[109],"probability":[110],".":[111],"Let":[112],"1":[113,117],">":[114,120],"\u03b4":[115],"=":[116],"\u2212":[118],"2q":[119],"0":[121],"be":[122],"bias.":[124]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2020-03-27T00:00:00"}
