{"id":"https://openalex.org/W4408060288","doi":"https://doi.org/10.14778/3705829.3705860","title":"The Cost of Representation by Subset Repairs","display_name":"The Cost of Representation by Subset Repairs","publication_year":2024,"publication_date":"2024-10-01","ids":{"openalex":"https://openalex.org/W4408060288","doi":"https://doi.org/10.14778/3705829.3705860"},"language":"en","primary_location":{"id":"doi:10.14778/3705829.3705860","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3705829.3705860","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100602636","display_name":"Yu-xi Liu","orcid":"https://orcid.org/0000-0002-3961-2691"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuxi Liu","raw_affiliation_strings":["Duke University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Duke University","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109241534","display_name":"Fangzhu Shen","orcid":null},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fangzhu Shen","raw_affiliation_strings":["Duke University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Duke University","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Kushagra Ghosh","orcid":null},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kushagra Ghosh","raw_affiliation_strings":["Duke University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Duke University","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027907153","display_name":"Amir Gilad","orcid":"https://orcid.org/0000-0002-3764-1958"},"institutions":[{"id":"https://openalex.org/I121297525","display_name":"Hebrew College","ror":"https://ror.org/05y3p3k12","country_code":"US","type":"education","lineage":["https://openalex.org/I121297525"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amir Gilad","raw_affiliation_strings":["Hebrew University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hebrew University","institution_ids":["https://openalex.org/I121297525"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006706357","display_name":"Benny Kimelfeld","orcid":"https://orcid.org/0000-0002-7156-1572"},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Benny Kimelfeld","raw_affiliation_strings":["Technion"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technion","institution_ids":["https://openalex.org/I174306211"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012463450","display_name":"Sudeepa Roy","orcid":null},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sudeepa Roy","raw_affiliation_strings":["Duke University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Duke University","institution_ids":["https://openalex.org/I170897317"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3055,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.68981257,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"18","issue":"2","first_page":"475","last_page":"487"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12002","display_name":"Computability, Logic, AI Algorithms","score":0.9657999873161316,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9330000281333923,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5378699898719788},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5038785338401794},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3342222273349762},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.04915809631347656}],"concepts":[{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5378699898719788},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5038785338401794},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3342222273349762},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.04915809631347656},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3705829.3705860","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3705829.3705860","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1492221961","https://openalex.org/W1989783863","https://openalex.org/W2014352947","https://openalex.org/W2044469685","https://openalex.org/W2046298800","https://openalex.org/W2059693475","https://openalex.org/W2064600658","https://openalex.org/W2064766209","https://openalex.org/W2081186682","https://openalex.org/W2153531471","https://openalex.org/W2162449239","https://openalex.org/W2163600218","https://openalex.org/W2405916311","https://openalex.org/W2522104760","https://openalex.org/W2548122763","https://openalex.org/W2569536984","https://openalex.org/W2591700809","https://openalex.org/W2612661634","https://openalex.org/W2941766203","https://openalex.org/W2948130259","https://openalex.org/W2964031043","https://openalex.org/W2964675004","https://openalex.org/W3008589870","https://openalex.org/W3015738839","https://openalex.org/W3030496122","https://openalex.org/W3089767549","https://openalex.org/W3094989159","https://openalex.org/W3110372784","https://openalex.org/W3125789530","https://openalex.org/W3173144982","https://openalex.org/W3210668460","https://openalex.org/W4287659481","https://openalex.org/W4289534040","https://openalex.org/W4386564359","https://openalex.org/W4389539805"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4391375266","https://openalex.org/W1979597421","https://openalex.org/W2007980826","https://openalex.org/W2061531152","https://openalex.org/W3002753104","https://openalex.org/W2077600819","https://openalex.org/W2142036596","https://openalex.org/W2072657027"],"abstract_inverted_index":{"Datasets":[0],"may":[1,35,45],"include":[2],"errors,":[3],"and":[4,31,82,145,171],"specifically":[5],"violations":[6,21],"of":[7,38,67,97,112,142,151,181,187,196],"integrity":[8,129],"constraints,":[9],"for":[10,15,24,80,88,102,135,168,174],"various":[11],"reasons.":[12],"Standard":[13],"techniques":[14],"\"minimalcost\"":[16],"database":[17],"repairing":[18],"resolve":[19],"these":[20],"by":[22],"aiming":[23],"a":[25,57,179],"minimum":[26],"change":[27],"in":[28,32,69,99,162,190],"the":[29,33,43,95,110,128,140,149,158,185,194],"data,":[30],"process,":[34],"sway":[36],"representations":[37],"different":[39,70],"sub-populations.":[40,71,137],"For":[41],"instance,":[42],"repair":[44],"end":[46],"up":[47],"deleting":[48],"more":[49,54],"females":[50],"than":[51],"males,":[52],"or":[53,61,192],"tuples":[55,116],"from":[56],"certain":[58],"age":[59],"group":[60],"race,":[62],"due":[63],"to":[64,85,118,124],"varying":[65],"levels":[66],"inconsistency":[68],"Such":[72],"repaired":[73],"data":[74],"can":[75,83],"mislead":[76],"consumers":[77],"when":[78],"used":[79],"analytics,":[81],"lead":[84],"biased":[86],"decisions":[87],"downstream":[89],"machine":[90],"learning":[91],"tasks.":[92],"We":[93,138,177],"study":[94,139],"\"cost":[96],"representation\"":[98],"subset":[100,153],"repairs":[101,154],"functional":[103],"dependencies.":[104],"In":[105],"simple":[106],"terms,":[107],"we":[108,122,164],"target":[109],"question":[111],"how":[113],"many":[114],"additional":[115],"have":[117],"be":[119],"deleted":[120],"if":[121],"want":[123],"satisfy":[125],"not":[126],"only":[127],"constraints":[130,134],"but":[131],"also":[132],"representation":[133],"given":[136],"complexity":[141,150],"this":[143],"problem":[144,159],"compare":[146],"it":[147],"with":[148],"optimal":[152],"without":[155],"representations.":[156],"While":[157],"is":[160],"NP-hard":[161],"general,":[163],"give":[165],"polynomial-time":[166],"algorithms":[167,189],"special":[169],"cases,":[170],"efficient":[172],"heuristics":[173],"general":[175],"cases.":[176],"perform":[178],"suite":[180],"experiments":[182],"that":[183],"show":[184],"effectiveness":[186],"our":[188],"computing":[191],"approximating":[193],"cost":[195],"representation.":[197]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
