{"id":"https://openalex.org/W2532450507","doi":"https://doi.org/10.1145/2983323.2983679","title":"Qualitative Cleaning of Uncertain Data","display_name":"Qualitative Cleaning of Uncertain Data","publication_year":2016,"publication_date":"2016-10-24","ids":{"openalex":"https://openalex.org/W2532450507","doi":"https://doi.org/10.1145/2983323.2983679","mag":"2532450507"},"language":"en","primary_location":{"id":"doi:10.1145/2983323.2983679","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2983323.2983679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th ACM International on Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006183138","display_name":"Henning K\u00f6ehler","orcid":"https://orcid.org/0000-0002-4688-920X"},"institutions":[{"id":"https://openalex.org/I51158804","display_name":"Massey University","ror":"https://ror.org/052czxv31","country_code":"NZ","type":"education","lineage":["https://openalex.org/I51158804"]}],"countries":["NZ"],"is_corresponding":true,"raw_author_name":"Henning Koehler","raw_affiliation_strings":["Massey University, Palmerston North, New Zealand"],"affiliations":[{"raw_affiliation_string":"Massey University, Palmerston North, New Zealand","institution_ids":["https://openalex.org/I51158804"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069839542","display_name":"Sebastian Link","orcid":"https://orcid.org/0000-0002-1816-2863"},"institutions":[{"id":"https://openalex.org/I154130895","display_name":"University of Auckland","ror":"https://ror.org/03b94tp07","country_code":"NZ","type":"education","lineage":["https://openalex.org/I154130895"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Sebastian Link","raw_affiliation_strings":["The University of Auckland, Auckland, New Zealand"],"affiliations":[{"raw_affiliation_string":"The University of Auckland, Auckland, New Zealand","institution_ids":["https://openalex.org/I154130895"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5006183138"],"corresponding_institution_ids":["https://openalex.org/I51158804"],"apc_list":null,"apc_paid":null,"fwci":1.4362,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.85239622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2269","last_page":"2274"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9714000225067139,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.961899995803833,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.8188233375549316},{"id":"https://openalex.org/keywords/vertex-cover","display_name":"Vertex cover","score":0.6915927529335022},{"id":"https://openalex.org/keywords/vertex","display_name":"Vertex (graph theory)","score":0.6741552352905273},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.6130587458610535},{"id":"https://openalex.org/keywords/cover","display_name":"Cover (algebra)","score":0.5481486916542053},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5089676380157471},{"id":"https://openalex.org/keywords/constraint-satisfaction-problem","display_name":"Constraint satisfaction problem","score":0.46084973216056824},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.45491719245910645},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4083041846752167},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.363244891166687},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.35613739490509033},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3538842499256134},{"id":"https://openalex.org/keywords/approximation-algorithm","display_name":"Approximation algorithm","score":0.28609853982925415},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.17087587714195251},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.13540714979171753},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.08305096626281738}],"concepts":[{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.8188233375549316},{"id":"https://openalex.org/C40687702","wikidata":"https://www.wikidata.org/wiki/Q11515519","display_name":"Vertex cover","level":3,"score":0.6915927529335022},{"id":"https://openalex.org/C80899671","wikidata":"https://www.wikidata.org/wiki/Q1304193","display_name":"Vertex (graph theory)","level":3,"score":0.6741552352905273},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.6130587458610535},{"id":"https://openalex.org/C2780428219","wikidata":"https://www.wikidata.org/wiki/Q16952335","display_name":"Cover (algebra)","level":2,"score":0.5481486916542053},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5089676380157471},{"id":"https://openalex.org/C199622910","wikidata":"https://www.wikidata.org/wiki/Q1128326","display_name":"Constraint satisfaction problem","level":3,"score":0.46084973216056824},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.45491719245910645},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4083041846752167},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.363244891166687},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.35613739490509033},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3538842499256134},{"id":"https://openalex.org/C148764684","wikidata":"https://www.wikidata.org/wiki/Q621751","display_name":"Approximation algorithm","level":2,"score":0.28609853982925415},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.17087587714195251},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.13540714979171753},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.08305096626281738},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2983323.2983679","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2983323.2983679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th ACM International on Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W380795639","https://openalex.org/W885593463","https://openalex.org/W1873489833","https://openalex.org/W1982345710","https://openalex.org/W1984302133","https://openalex.org/W1988443389","https://openalex.org/W1997945384","https://openalex.org/W2004443904","https://openalex.org/W2039548475","https://openalex.org/W2041442195","https://openalex.org/W2077518845","https://openalex.org/W2078132546","https://openalex.org/W2081037581","https://openalex.org/W2082563279","https://openalex.org/W2107309064","https://openalex.org/W2116087731","https://openalex.org/W2171204442","https://openalex.org/W2240640875","https://openalex.org/W2249542348","https://openalex.org/W2294301821","https://openalex.org/W2295468252","https://openalex.org/W2338322935","https://openalex.org/W2401610261","https://openalex.org/W2411051717","https://openalex.org/W2411740706","https://openalex.org/W2437617937","https://openalex.org/W2440730883","https://openalex.org/W2462538567","https://openalex.org/W2569536984","https://openalex.org/W2573378428","https://openalex.org/W3138538843","https://openalex.org/W4239610380","https://openalex.org/W4298054708","https://openalex.org/W4300807684","https://openalex.org/W4388282953","https://openalex.org/W6635454507"],"related_works":["https://openalex.org/W4245395944","https://openalex.org/W2143551613","https://openalex.org/W1979740464","https://openalex.org/W2143345456","https://openalex.org/W2138823233","https://openalex.org/W1789991335","https://openalex.org/W2562731034","https://openalex.org/W4315705795","https://openalex.org/W2101053337","https://openalex.org/W2783796426"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,69,85,115],"new":[3,70],"view":[4],"on":[5],"data":[6,9,18,49],"cleaning:":[7],"Not":[8],"itself":[10],"but":[11],"the":[12,74,96,107,124,127,141],"degrees":[13,27,38,62,108],"of":[14,28,39,55,63,73,109,126,149,157],"uncertainty":[15,158],"attributed":[16],"to":[17,43,68,84,113],"are":[19,25,36],"dirty.":[20],"Applying":[21],"possibility":[22,29,110],"theory,":[23],"tuples":[24,45],"assigned":[26,37],"with":[30,154],"which":[31,44],"they":[32,46],"occur,":[33],"and":[34,111,151],"constraints":[35],"certainty":[40,112],"that":[41,118,133],"say":[42],"apply.":[47],"Classical":[48],"cleaning":[50],"modifies":[51],"some":[52],"minimal":[53],"set":[54],"tuples.":[56],"Instead,":[57,104],"we":[58,105],"marginally":[59],"reduce":[60],"their":[61],"possibility.":[64],"This":[65],"reduction":[66],"leads":[67],"qualitative":[71,128],"version":[72],"vertex":[75,79,102,129,143],"cover":[76,80,144],"problem.":[77,89],"Qualitative":[78],"can":[81],"be":[82],"mapped":[83],"linear-weighted":[86],"constraint":[87],"satisfaction":[88],"However,":[90],"any":[91],"off-the-shelf":[92],"solver":[93],"cannot":[94],"solve":[95],"problem":[97,145],"more":[98],"efficiently":[99],"than":[100,138],"classical":[101,142],"cover.":[103,130],"utilize":[106],"develop":[114],"dedicated":[116],"algorithm":[117,135],"is":[119,136],"fixed":[120],"parameter":[121],"tractable":[122],"in":[123],"size":[125],"Experiments":[131],"show":[132],"our":[134],"faster":[137],"solvers":[139],"for":[140],"by":[146],"several":[147],"orders":[148],"magnitude,":[150],"performance":[152],"improves":[153],"higher":[155],"numbers":[156],"degrees.":[159]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
