{"id":"https://openalex.org/W4281783139","doi":"https://doi.org/10.1145/3514221.3517864","title":"DataPrism: Exposing Disconnect between Data and Systems","display_name":"DataPrism: Exposing Disconnect between Data and Systems","publication_year":2022,"publication_date":"2022-06-10","ids":{"openalex":"https://openalex.org/W4281783139","doi":"https://doi.org/10.1145/3514221.3517864"},"language":"en","primary_location":{"id":"doi:10.1145/3514221.3517864","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3514221.3517864","pdf_url":null,"source":{"id":"https://openalex.org/S4363608845","display_name":"Proceedings of the 2022 International Conference on Management of Data","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://orbilu.uni.lu/bitstream/10993/57629/1/3514221.3517864.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112842550","display_name":"Sainyam Galhotra","orcid":null},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]},{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sainyam Galhotra","raw_affiliation_strings":["University of Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I40347166","https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087503380","display_name":"Anna Fariha","orcid":"https://orcid.org/0000-0002-5275-7844"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anna Fariha","raw_affiliation_strings":["Microsoft, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Seattle, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035164855","display_name":"Raoni Louren\u00e7o","orcid":"https://orcid.org/0000-0001-7774-4487"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Raoni Louren\u00e7o","raw_affiliation_strings":["New York University, NYC, NY, USA"],"affiliations":[{"raw_affiliation_string":"New York University, NYC, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006773757","display_name":"Juliana Freire","orcid":"https://orcid.org/0000-0003-3915-7075"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juliana Freire","raw_affiliation_strings":["New York University, NYC, NY, USA"],"affiliations":[{"raw_affiliation_string":"New York University, NYC, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019048013","display_name":"Alexandra Meliou","orcid":"https://orcid.org/0000-0001-7346-6002"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexandra Meliou","raw_affiliation_strings":["University of Massachusetts Amherst, Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts Amherst, Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088315797","display_name":"Divesh Srivastava","orcid":"https://orcid.org/0000-0002-7609-9217"},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Divesh Srivastava","raw_affiliation_strings":["AT&amp;T Chief Data Office, Bedminster, NJ, USA"],"affiliations":[{"raw_affiliation_string":"AT&amp;T Chief Data Office, Bedminster, NJ, USA","institution_ids":["https://openalex.org/I1283103587"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5112842550"],"corresponding_institution_ids":["https://openalex.org/I39422238","https://openalex.org/I40347166"],"apc_list":null,"apc_paid":null,"fwci":1.7295,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.83954394,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"217","last_page":"231"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/debugging","display_name":"Debugging","score":0.8287352323532104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7276153564453125},{"id":"https://openalex.org/keywords/root-cause","display_name":"Root cause","score":0.7078014612197876},{"id":"https://openalex.org/keywords/software-bug","display_name":"Software bug","score":0.5454583168029785},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5276783108711243},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4876933991909027},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.45701295137405396},{"id":"https://openalex.org/keywords/data-integrity","display_name":"Data integrity","score":0.4111475944519043},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.40804779529571533},{"id":"https://openalex.org/keywords/reliability-engineering","display_name":"Reliability engineering","score":0.2794744372367859},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.14940598607063293},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1455153524875641},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12330275774002075}],"concepts":[{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.8287352323532104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7276153564453125},{"id":"https://openalex.org/C84945661","wikidata":"https://www.wikidata.org/wiki/Q7366567","display_name":"Root cause","level":2,"score":0.7078014612197876},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.5454583168029785},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5276783108711243},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4876933991909027},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.45701295137405396},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.4111475944519043},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.40804779529571533},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.2794744372367859},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.14940598607063293},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1455153524875641},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12330275774002075},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3514221.3517864","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3514221.3517864","pdf_url":null,"source":{"id":"https://openalex.org/S4363608845","display_name":"Proceedings of the 2022 International Conference on Management of Data","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Conference on Management of Data","raw_type":"proceedings-article"},{"id":"pmh:oai:orbilu.uni.lu:10993/57629","is_oa":true,"landing_page_url":"https://orbilu.uni.lu/handle/10993/57629","pdf_url":"https://orbilu.uni.lu/bitstream/10993/57629/1/3514221.3517864.pdf","source":{"id":"https://openalex.org/S4306401815","display_name":"Open Repository and Bibliography (University of Luxembourg)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I186903577","host_organization_name":"University of Luxembourg","host_organization_lineage":["https://openalex.org/I186903577"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"SIGMOD 2022 - Proceedings of the 2022 International Conference on Management of Data (2022-06-10); Proceedings of the 2022 International Conference on Management of Data, Philladelphia, Usa [Usa], 12-06-2022 => 17-06-2022","raw_type":"peer reviewed"}],"best_oa_location":{"id":"pmh:oai:orbilu.uni.lu:10993/57629","is_oa":true,"landing_page_url":"https://orbilu.uni.lu/handle/10993/57629","pdf_url":"https://orbilu.uni.lu/bitstream/10993/57629/1/3514221.3517864.pdf","source":{"id":"https://openalex.org/S4306401815","display_name":"Open Repository and Bibliography (University of Luxembourg)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I186903577","host_organization_name":"University of Luxembourg","host_organization_lineage":["https://openalex.org/I186903577"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"SIGMOD 2022 - Proceedings of the 2022 International Conference on Management of Data (2022-06-10); Proceedings of the 2022 International Conference on Management of Data, Philladelphia, Usa [Usa], 12-06-2022 => 17-06-2022","raw_type":"peer reviewed"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1382722559","display_name":null,"funder_award_id":"CCF-1763423, IIS-1943971,IIS-1916505, OAC-1934464","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4281783139.pdf","grobid_xml":"https://content.openalex.org/works/W4281783139.grobid-xml"},"referenced_works_count":49,"referenced_works":["https://openalex.org/W760598031","https://openalex.org/W1565102206","https://openalex.org/W1596552075","https://openalex.org/W1993760289","https://openalex.org/W2000809552","https://openalex.org/W2053075547","https://openalex.org/W2065000833","https://openalex.org/W2100155384","https://openalex.org/W2102489964","https://openalex.org/W2108132403","https://openalex.org/W2111607551","https://openalex.org/W2113302524","https://openalex.org/W2143522309","https://openalex.org/W2146747981","https://openalex.org/W2162376048","https://openalex.org/W2162449239","https://openalex.org/W2170712852","https://openalex.org/W2282821441","https://openalex.org/W2303408782","https://openalex.org/W2402668406","https://openalex.org/W2521016955","https://openalex.org/W2591700809","https://openalex.org/W2613751718","https://openalex.org/W2614062172","https://openalex.org/W2730550703","https://openalex.org/W2788403449","https://openalex.org/W2889801262","https://openalex.org/W2897042519","https://openalex.org/W2898098214","https://openalex.org/W2899327512","https://openalex.org/W2944436223","https://openalex.org/W2948130259","https://openalex.org/W2948234719","https://openalex.org/W2997315920","https://openalex.org/W2999876407","https://openalex.org/W3015276915","https://openalex.org/W3029990846","https://openalex.org/W3030026364","https://openalex.org/W3031898476","https://openalex.org/W3032405843","https://openalex.org/W3084564478","https://openalex.org/W3100279624","https://openalex.org/W3103264664","https://openalex.org/W3197847098","https://openalex.org/W4256084472","https://openalex.org/W4291714342","https://openalex.org/W4293162521","https://openalex.org/W4298949291","https://openalex.org/W6772730766"],"related_works":["https://openalex.org/W2111708921","https://openalex.org/W2740264376","https://openalex.org/W4206999239","https://openalex.org/W2900719967","https://openalex.org/W4388482952","https://openalex.org/W2161928627","https://openalex.org/W2786113878","https://openalex.org/W2787155073","https://openalex.org/W2727867943","https://openalex.org/W4322631505"],"abstract_inverted_index":{"As":[0],"data":[1,71,83,98,121,127,149,180],"is":[2,32,39,68,117,132],"a":[3,13,28,94,112,140,144,206],"central":[4],"component":[5],"of":[6,12,25,76,106,111,179,183,209,223],"many":[7],"modern":[8],"systems,":[9],"the":[10,19,35,60,79,103,124,148,155,160,184,216],"cause":[11],"system":[14,30,141,185],"malfunction":[15,44],"may":[16],"reside":[17],"in":[18,41,49,59,154,177],"data,":[20],"and,":[21],"specifically,":[22],"particular":[23],"properties":[24,99],"data.":[26,90],"E.g.,":[27],"health-monitoring":[29],"that":[31,37,86,89,101,166,199],"designed":[33],"under":[34],"assumption":[36],"weight":[38,47],"reported":[40,48],"lbs":[42],"will":[43],"when":[45,139],"encountering":[46],"kilograms.":[50],"Like":[51],"software":[52],"debugging,":[53],"which":[54],"aims":[55],"to":[56,69,72,96,119,159,205],"find":[57],"bugs":[58],"source":[61],"code":[62],"or":[63,109],"runtime":[64],"conditions,":[65],"our":[66],"goal":[67],"debug":[70],"identify":[73,97],"potential":[74],"sources":[75],"disconnect":[77,125],"between":[78,126],"assumptions":[80],"about":[81],"some":[82],"and":[84,122,128,151,194],"systems":[85,198],"operate":[87],"on":[88,134,191,201],"We":[91,187],"propose":[92],"DataPrism,":[93],"framework":[95],"(profiles)":[100],"are":[102],"root":[104,174,217],"causes":[105,175,218],"performance":[107],"degradation":[108],"failure":[110],"data-driven":[113,197],"system.":[114],"Such":[115],"identification":[116],"necessary":[118],"repair":[120],"resolve":[123],"systems.":[129],"Our":[130],"technique":[131],"based":[133],"causal":[135],"reasoning":[136],"through":[137],"interventions:":[138],"malfunctions":[142],"for":[143],"dataset,":[145],"DataPrism":[146,170,190,214],"alters":[147],"profiles":[150,181],"observes":[152],"changes":[153],"system's":[156],"behavior":[157],"due":[158,204],"alteration.":[161],"Unlike":[162],"statistical":[163],"observational":[164],"analysis":[165],"reports":[167,171],"mere":[168],"correlations,":[169],"causally":[172],"verified":[173],"--":[176,182],"terms":[178],"malfunction.":[186],"empirically":[188],"evaluate":[189],"seven":[192],"real-world":[193],"several":[195],"synthetic":[196],"fail":[200],"certain":[202],"datasets":[203],"diverse":[207],"set":[208],"reasons.":[210],"In":[211],"all":[212],"cases,":[213],"identifies":[215],"precisely":[219],"while":[220],"requiring":[221],"orders":[222],"magnitude":[224],"fewer":[225],"interventions":[226],"than":[227],"prior":[228],"techniques.":[229]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
