{"id":"https://openalex.org/W2966851149","doi":"https://doi.org/10.1145/3332186.3332222","title":"Integrity Protection for Scientific Workflow Data","display_name":"Integrity Protection for Scientific Workflow Data","publication_year":2019,"publication_date":"2019-07-28","ids":{"openalex":"https://openalex.org/W2966851149","doi":"https://doi.org/10.1145/3332186.3332222","mag":"2966851149"},"language":"en","primary_location":{"id":"doi:10.1145/3332186.3332222","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3332186.3332222","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3332186.3332222","source":{"id":"https://openalex.org/S4306524297","display_name":"Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3332186.3332222","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079942660","display_name":"Mats Rynge","orcid":"https://orcid.org/0000-0002-1779-7189"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mats Rynge","raw_affiliation_strings":["Information Sciences Institute - University of Southern, California"],"affiliations":[{"raw_affiliation_string":"Information Sciences Institute - University of Southern, California","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055471608","display_name":"Karan Vahi","orcid":"https://orcid.org/0000-0001-8622-2082"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Karan Vahi","raw_affiliation_strings":["Information Sciences Institute - University of Southern, California"],"affiliations":[{"raw_affiliation_string":"Information Sciences Institute - University of Southern, California","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031941569","display_name":"Ewa Deelman","orcid":"https://orcid.org/0000-0001-5106-503X"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ewa Deelman","raw_affiliation_strings":["Information Sciences Institute - University of Southern, California"],"affiliations":[{"raw_affiliation_string":"Information Sciences Institute - University of Southern, California","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063480283","display_name":"Anirban Mandal","orcid":"https://orcid.org/0000-0001-5145-8618"},"institutions":[{"id":"https://openalex.org/I69048370","display_name":"Renaissance Computing Institute","ror":"https://ror.org/01s91ey96","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535","https://openalex.org/I170897317","https://openalex.org/I69048370"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anirban Mandal","raw_affiliation_strings":["RENCI - University of North Carolina, Chapel Hill"],"affiliations":[{"raw_affiliation_string":"RENCI - University of North Carolina, Chapel Hill","institution_ids":["https://openalex.org/I69048370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050863093","display_name":"Ilya Baldin","orcid":"https://orcid.org/0000-0001-7158-0143"},"institutions":[{"id":"https://openalex.org/I69048370","display_name":"Renaissance Computing Institute","ror":"https://ror.org/01s91ey96","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535","https://openalex.org/I170897317","https://openalex.org/I69048370"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ilya Baldin","raw_affiliation_strings":["RENCI - University of North Carolina, Chapel Hill"],"affiliations":[{"raw_affiliation_string":"RENCI - University of North Carolina, Chapel Hill","institution_ids":["https://openalex.org/I69048370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085246999","display_name":"Omkar Bhide","orcid":null},"institutions":[{"id":"https://openalex.org/I592451","display_name":"Indiana University","ror":"https://ror.org/01kg8sb98","country_code":"US","type":"education","lineage":["https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Omkar Bhide","raw_affiliation_strings":["Indiana University"],"affiliations":[{"raw_affiliation_string":"Indiana University","institution_ids":["https://openalex.org/I592451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058904152","display_name":"Randy Heiland","orcid":"https://orcid.org/0000-0002-7440-2905"},"institutions":[{"id":"https://openalex.org/I592451","display_name":"Indiana University","ror":"https://ror.org/01kg8sb98","country_code":"US","type":"education","lineage":["https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Randy Heiland","raw_affiliation_strings":["Indiana University"],"affiliations":[{"raw_affiliation_string":"Indiana University","institution_ids":["https://openalex.org/I592451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042723051","display_name":"Von Welch","orcid":"https://orcid.org/0000-0002-5896-7789"},"institutions":[{"id":"https://openalex.org/I592451","display_name":"Indiana University","ror":"https://ror.org/01kg8sb98","country_code":"US","type":"education","lineage":["https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Von Welch","raw_affiliation_strings":["Indiana University"],"affiliations":[{"raw_affiliation_string":"Indiana University","institution_ids":["https://openalex.org/I592451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045850342","display_name":"Raquel Hill","orcid":"https://orcid.org/0000-0001-7963-5540"},"institutions":[{"id":"https://openalex.org/I592451","display_name":"Indiana University","ror":"https://ror.org/01kg8sb98","country_code":"US","type":"education","lineage":["https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Raquel Hill","raw_affiliation_strings":["Indiana University"],"affiliations":[{"raw_affiliation_string":"Indiana University","institution_ids":["https://openalex.org/I592451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072869296","display_name":"William L. Poehlman","orcid":"https://orcid.org/0000-0002-3659-9663"},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William L. Poehlman","raw_affiliation_strings":["Clemson University"],"affiliations":[{"raw_affiliation_string":"Clemson University","institution_ids":["https://openalex.org/I8078737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043213807","display_name":"F. Alex Feltus","orcid":"https://orcid.org/0000-0002-2123-6114"},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"F. Alex Feltus","raw_affiliation_strings":["Clemson University"],"affiliations":[{"raw_affiliation_string":"Clemson University","institution_ids":["https://openalex.org/I8078737"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5079942660"],"corresponding_institution_ids":["https://openalex.org/I1174212"],"apc_list":null,"apc_paid":null,"fwci":3.5203,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.94953477,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/checksum","display_name":"Checksum","score":0.8516668081283569},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8069735765457153},{"id":"https://openalex.org/keywords/data-integrity","display_name":"Data integrity","score":0.7596033215522766},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.7095447778701782},{"id":"https://openalex.org/keywords/encryption","display_name":"Encryption","score":0.46313053369522095},{"id":"https://openalex.org/keywords/erasure-code","display_name":"Erasure code","score":0.41537585854530334},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.4065665006637573},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.36482420563697815},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.16636168956756592}],"concepts":[{"id":"https://openalex.org/C162372511","wikidata":"https://www.wikidata.org/wiki/Q218341","display_name":"Checksum","level":2,"score":0.8516668081283569},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8069735765457153},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.7596033215522766},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.7095447778701782},{"id":"https://openalex.org/C148730421","wikidata":"https://www.wikidata.org/wiki/Q141090","display_name":"Encryption","level":2,"score":0.46313053369522095},{"id":"https://openalex.org/C137529215","wikidata":"https://www.wikidata.org/wiki/Q5385031","display_name":"Erasure code","level":3,"score":0.41537585854530334},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.4065665006637573},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.36482420563697815},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.16636168956756592},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3332186.3332222","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3332186.3332222","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3332186.3332222","source":{"id":"https://openalex.org/S4306524297","display_name":"Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3332186.3332222","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3332186.3332222","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3332186.3332222","source":{"id":"https://openalex.org/S4306524297","display_name":"Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.8100000023841858,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G3415494668","display_name":"Collaborative Research: CICI: Secure and Resilient Architecture: Scientific Workflow Integrity with Pegasus","funder_award_id":"1642070","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4691017392","display_name":"Collaborative Research: CICI: Secure and Resilient Architecture: Scientific Workflow Integrity with Pegasus.","funder_award_id":"1642090","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6840893325","display_name":null,"funder_award_id":"1664162","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7340972926","display_name":null,"funder_award_id":"other","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G8026541174","display_name":"Collaborative Research: CICI: Secure and Resilient Architecture: Scientific Workflow Integrity with Pegasus","funder_award_id":"1642053","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8727083658","display_name":null,"funder_award_id":"1148698","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320332359","display_name":"Office of Science","ror":"https://ror.org/00mmn6b08"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2966851149.pdf","grobid_xml":"https://content.openalex.org/works/W2966851149.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W67188827","https://openalex.org/W1588132832","https://openalex.org/W1959194376","https://openalex.org/W2043701535","https://openalex.org/W2053856160","https://openalex.org/W2055658655","https://openalex.org/W2071358630","https://openalex.org/W2088379928","https://openalex.org/W2098921755","https://openalex.org/W2124088880","https://openalex.org/W2166459269","https://openalex.org/W2496673950","https://openalex.org/W2499147289","https://openalex.org/W2583342949","https://openalex.org/W2731994290","https://openalex.org/W2742474178","https://openalex.org/W2766445584","https://openalex.org/W2775500188","https://openalex.org/W2888555477","https://openalex.org/W2899895887","https://openalex.org/W3011856351","https://openalex.org/W4206816857","https://openalex.org/W4244630465","https://openalex.org/W4318211321"],"related_works":["https://openalex.org/W2584928298","https://openalex.org/W2073512695","https://openalex.org/W4285328204","https://openalex.org/W2126447415","https://openalex.org/W2188809546","https://openalex.org/W2136646084","https://openalex.org/W2966851149","https://openalex.org/W2182068290","https://openalex.org/W4253616297","https://openalex.org/W2617986690"],"abstract_inverted_index":{"With":[0],"the":[1,8,12,22,31,34,66,142],"continued":[2],"rise":[3],"of":[4,14,33,125,173,192],"scientific":[5,35],"computing":[6],"and":[7,26,45,68,83,101,179],"enormous":[9],"increases":[10],"in":[11,47,60,111],"size":[13],"data":[15,28,99,113,127,177],"being":[16],"processed,":[17],"scientists":[18],"must":[19],"consider":[20],"whether":[21],"processes":[23],"for":[24,137,161],"transmitting":[25],"storing":[27],"sufficiently":[29],"assure":[30],"integrity":[32,38,87,128,163,174,193],"data.":[36],"When":[37],"is":[39],"not":[40,63,95,103],"preserved,":[41],"computations":[42],"can":[43,57,115],"fail":[44],"result":[46],"increased":[48],"computational":[49],"cost":[50],"due":[51],"to":[52,65,97,169,183],"reruns,":[53],"or":[54,133],"worse,":[55],"results":[56],"be":[58],"corrupted":[59],"a":[61,105,156,171],"manner":[62],"apparent":[64],"scientist":[67],"produce":[69],"invalid":[70],"science":[71],"results.":[72],"Technologies":[73],"such":[74],"as":[75],"TCP":[76],"checksums,":[77],"encrypted":[78],"transfers,":[79],"checksum":[80],"validation,":[81],"RAID":[82],"erasure":[84],"coding":[85],"provide":[86,190],"assurances":[88],"at":[89],"different":[90],"levels,":[91],"but":[92],"they":[93],"may":[94,102],"scale":[96],"large":[98],"sizes":[100],"cover":[104],"workflow":[106,138],"from":[107],"end-to-end,":[108],"leaving":[109],"gaps":[110],"which":[112],"corruption":[114,135],"occur":[116],"undetected.":[117],"In":[118,181],"this":[119],"paper":[120],"we":[121,151,189,196],"explore":[122],"an":[123,159],"approach":[124],"assuring":[126],"-":[129,136,155],"considering":[130],"either":[131],"malicious":[132],"accidental":[134],"executions":[139],"orchestrated":[140],"by":[141,166],"Pegasus":[143],"Workflow":[144],"Management":[145],"System.":[146],"To":[147],"validate":[148],"our":[149],"approach,":[150],"introduce":[152,170],"Chaos":[153,187],"Jungle":[154],"toolkit":[157],"providing":[158],"environment":[160],"validating":[162],"verification":[164],"mechanisms":[165],"allowing":[167],"researchers":[168],"variety":[172],"errors":[175,194],"during":[176],"transfers":[178],"storage.":[180],"addition":[182],"controlled":[184],"experiments":[185],"with":[186],"Jungle,":[188],"analysis":[191],"that":[195],"encountered":[197],"when":[198],"running":[199],"production":[200],"workflows.":[201]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-15T09:29:46.208133","created_date":"2025-10-10T00:00:00"}
