{"id":"https://openalex.org/W4413978214","doi":"https://doi.org/10.14778/3749646.3749721","title":"Stress-Testing ML Pipelines with Adversarial Data Corruption","display_name":"Stress-Testing ML Pipelines with Adversarial Data Corruption","publication_year":2025,"publication_date":"2025-07-01","ids":{"openalex":"https://openalex.org/W4413978214","doi":"https://doi.org/10.14778/3749646.3749721"},"language":"en","primary_location":{"id":"doi:10.14778/3749646.3749721","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3749646.3749721","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004156121","display_name":"Jiongli Zhu","orcid":"https://orcid.org/0000-0002-3238-8674"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jiongli Zhu","raw_affiliation_strings":["University of California, San Diego, USA"],"affiliations":[{"raw_affiliation_string":"University of California, San Diego, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017389050","display_name":"Guiyin Xu","orcid":"https://orcid.org/0000-0002-5959-4814"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Geyang Xu","raw_affiliation_strings":["University of California, San Diego, USA"],"affiliations":[{"raw_affiliation_string":"University of California, San Diego, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119535914","display_name":"Felipe Lorenzi","orcid":null},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Felipe Lorenzi","raw_affiliation_strings":["University of California, San Diego, USA"],"affiliations":[{"raw_affiliation_string":"University of California, San Diego, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061858093","display_name":"Boris Glavic","orcid":"https://orcid.org/0000-0003-2887-2452"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Boris Glavic","raw_affiliation_strings":["University of Illinois, Chicago, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois, Chicago, USA","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5092007889","display_name":"Babak Salimi","orcid":"https://orcid.org/0000-0001-8763-8354"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Babak Salimi","raw_affiliation_strings":["University of California, San Diego, USA"],"affiliations":[{"raw_affiliation_string":"University of California, San Diego, USA","institution_ids":["https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5004156121"],"corresponding_institution_ids":["https://openalex.org/I36258959"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13566634,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"18","issue":"11","first_page":"4668","last_page":"4681"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12122","display_name":"Physical Unclonable Functions (PUFs) and Hardware Security","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7186254262924194},{"id":"https://openalex.org/keywords/language-change","display_name":"Language change","score":0.5233837366104126},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.46724677085876465},{"id":"https://openalex.org/keywords/stress-testing","display_name":"Stress testing (software)","score":0.4539577066898346},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.41241875290870667},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3850991129875183},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.22157055139541626},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.12445688247680664},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08161962032318115},{"id":"https://openalex.org/keywords/mechanical-engineering","display_name":"Mechanical engineering","score":0.06625202298164368},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.058777958154678345}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7186254262924194},{"id":"https://openalex.org/C2780027415","wikidata":"https://www.wikidata.org/wiki/Q524648","display_name":"Language change","level":2,"score":0.5233837366104126},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.46724677085876465},{"id":"https://openalex.org/C7515471","wikidata":"https://www.wikidata.org/wiki/Q1936882","display_name":"Stress testing (software)","level":2,"score":0.4539577066898346},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.41241875290870667},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3850991129875183},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.22157055139541626},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.12445688247680664},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08161962032318115},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.06625202298164368},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.058777958154678345},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3749646.3749721","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3749646.3749721","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W15592790","https://openalex.org/W2024834471","https://openalex.org/W2116984840","https://openalex.org/W2725878222","https://openalex.org/W2964043980","https://openalex.org/W2964060211","https://openalex.org/W2997591727","https://openalex.org/W3125924446","https://openalex.org/W3126041148","https://openalex.org/W3164186389","https://openalex.org/W3165428735","https://openalex.org/W3173326111","https://openalex.org/W3176502563","https://openalex.org/W3212960901","https://openalex.org/W3214399478","https://openalex.org/W4241561347","https://openalex.org/W4281770862","https://openalex.org/W4285451014","https://openalex.org/W4308255668","https://openalex.org/W4308469411","https://openalex.org/W4317883989","https://openalex.org/W4322736917","https://openalex.org/W4381328625","https://openalex.org/W4408444355"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W4246396837","https://openalex.org/W3126451824","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W4310988119","https://openalex.org/W4285226279","https://openalex.org/W4288019534"],"abstract_inverted_index":{"Structured":[0],"data-quality":[1,63],"issues\u2014such":[2],"as":[3,112],"missing":[4],"values":[5],"correlated":[6],"with":[7],"demographics,":[8],"culturally":[9],"biased":[10],"labels,":[11],"or":[12,43,151],"systemic":[13],"selection":[14],"biases\u2014routinely":[15],"degrade":[16,80],"the":[17,102],"reliability":[18],"of":[19,138,159],"machine-learning":[20],"pipelines.":[21],"Regulators":[22],"now":[23],"increasingly":[24],"demand":[25],"evidence":[26],"that":[27,58,78,131],"high-stakes":[28],"systems":[29],"can":[30],"withstand":[31],"these":[32],"realistic,":[33],"interdependent":[34],"errors,":[35,154],"yet":[36],"current":[37],"robustness":[38,176],"evaluations":[39],"typically":[40],"use":[41],"random":[42,150],"overly":[44],"simplistic":[45],"corruptions,":[46],"leaving":[47],"worst-case":[48],"scenarios":[49],"unexplored.":[50],"We":[51],"introduce":[52],"Savage,":[53],"a":[54,81,87,113,133,165,172],"causally":[55],"inspired":[56],"framework":[57],"(i)":[59],"formally":[60],"models":[61],"realistic":[62],"issues":[64],"through":[65],"dependency":[66],"graphs":[67],"and":[68,72,97,108,121,155,178],"flexible":[69],"corruption":[70,76,99],"templates,":[71],"(ii)":[73],"systematically":[74],"discovers":[75],"patterns":[77],"maximally":[79],"target":[82],"performance":[83],"metric.":[84],"Savage":[85,143,163],"employs":[86],"bi-level":[88],"optimization":[89],"approach":[90],"to":[91],"efficiently":[92],"identify":[93],"vulnerable":[94],"data":[95,185],"subpopulations":[96],"fine-tune":[98],"severity,":[100],"treating":[101],"full":[103],"ML":[104,122],"pipeline,":[105],"including":[106],"preprocessing":[107],"potentially":[109],"non-differentiable":[110],"models,":[111],"black":[114],"box.":[115],"Extensive":[116],"experiments":[117],"across":[118],"multiple":[119],"datasets":[120],"tasks":[123],"(data":[124],"cleaning,":[125],"fairness-aware":[126],"learning,":[127],"uncertainty":[128],"quantification)":[129],"demonstrate":[130],"even":[132],"small":[134],"fraction":[135],"(around":[136],"5%)":[137],"structured":[139],"corruptions":[140],"identified":[141],"by":[142],"severely":[144],"impacts":[145],"model":[146],"performance,":[147],"far":[148],"exceeding":[149],"manually":[152],"crafted":[153],"invalidating":[156],"core":[157],"assumptions":[158],"existing":[160],"techniques.":[161],"Thus,":[162],"provides":[164],"practical":[166],"tool":[167],"for":[168,174,181],"rigorous":[169],"pipeline":[170],"stress-testing,":[171],"benchmark":[173],"evaluating":[175],"methods,":[177],"actionable":[179],"guidance":[180],"designing":[182],"more":[183],"resilient":[184],"workflows.":[186]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
