{"id":"https://openalex.org/W2005998283","doi":"https://doi.org/10.1145/2742854.2742903","title":"Programmer-directed partial redundancy for resilient HPC","display_name":"Programmer-directed partial redundancy for resilient HPC","publication_year":2015,"publication_date":"2015-05-06","ids":{"openalex":"https://openalex.org/W2005998283","doi":"https://doi.org/10.1145/2742854.2742903","mag":"2005998283"},"language":"en","primary_location":{"id":"doi:10.1145/2742854.2742903","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2742854.2742903","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th ACM International Conference on Computing Frontiers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/2117/91299","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034946156","display_name":"Omer Subasi","orcid":"https://orcid.org/0000-0002-5373-7570"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Omer Subasi","raw_affiliation_strings":["Universitat Politecnica de Catalunya"],"affiliations":[{"raw_affiliation_string":"Universitat Politecnica de Catalunya","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110004560","display_name":"Javier Arias","orcid":null},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Javier Arias","raw_affiliation_strings":["Universitat Politecnica de Catalunya"],"affiliations":[{"raw_affiliation_string":"Universitat Politecnica de Catalunya","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075162875","display_name":"Osman \u00dcnsal","orcid":"https://orcid.org/0000-0002-0544-9697"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Osman Unsal","raw_affiliation_strings":["Universitat Politecnica de Catalunya"],"affiliations":[{"raw_affiliation_string":"Universitat Politecnica de Catalunya","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035035680","display_name":"Jes\u00fas Labarta","orcid":"https://orcid.org/0000-0002-7489-4727"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Jesus Labarta","raw_affiliation_strings":["Universitat Politecnica de Catalunya"],"affiliations":[{"raw_affiliation_string":"Universitat Politecnica de Catalunya","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084390427","display_name":"Adri\u00e1n Cristal","orcid":"https://orcid.org/0000-0003-1277-9296"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Adrian Cristal","raw_affiliation_strings":["Universitat Politecnica de Catalunya"],"affiliations":[{"raw_affiliation_string":"Universitat Politecnica de Catalunya","institution_ids":["https://openalex.org/I9617848"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5034946156"],"corresponding_institution_ids":["https://openalex.org/I9617848"],"apc_list":null,"apc_paid":null,"fwci":5.9559,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.96416158,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/programmer","display_name":"Programmer","score":0.8824188709259033},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.841732382774353},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.7216730713844299},{"id":"https://openalex.org/keywords/fault-tolerance","display_name":"Fault tolerance","score":0.6890614628791809},{"id":"https://openalex.org/keywords/replication","display_name":"Replication (statistics)","score":0.6751124858856201},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5146409273147583},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4771656095981598},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.47570592164993286},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3958161473274231},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3413185477256775},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.30188921093940735}],"concepts":[{"id":"https://openalex.org/C2778514511","wikidata":"https://www.wikidata.org/wiki/Q1374194","display_name":"Programmer","level":2,"score":0.8824188709259033},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.841732382774353},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.7216730713844299},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.6890614628791809},{"id":"https://openalex.org/C12590798","wikidata":"https://www.wikidata.org/wiki/Q3933199","display_name":"Replication (statistics)","level":2,"score":0.6751124858856201},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5146409273147583},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4771656095981598},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.47570592164993286},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3958161473274231},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3413185477256775},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.30188921093940735},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2742854.2742903","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2742854.2742903","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th ACM International Conference on Computing Frontiers","raw_type":"proceedings-article"},{"id":"pmh:oai:recercat.cat:2072/340846","is_oa":true,"landing_page_url":"http://hdl.handle.net/2117/91299","pdf_url":null,"source":{"id":"https://openalex.org/S4306402147","display_name":"RECERCAT (Consorci de Serveis Universitaris de Catalunya)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210090028","host_organization_name":"Consorci de Serveis Universitaris de Catalunya","host_organization_lineage":["https://openalex.org/I4210090028"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:recercat.cat:2072/340846","is_oa":true,"landing_page_url":"http://hdl.handle.net/2117/91299","pdf_url":null,"source":{"id":"https://openalex.org/S4306402147","display_name":"RECERCAT (Consorci de Serveis Universitaris de Catalunya)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210090028","host_organization_name":"Consorci de Serveis Universitaris de Catalunya","host_organization_lineage":["https://openalex.org/I4210090028"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7900000214576721}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W47306539","https://openalex.org/W2036641664","https://openalex.org/W2070638479","https://openalex.org/W2105524676","https://openalex.org/W2142677441","https://openalex.org/W2485170526"],"related_works":["https://openalex.org/W2153096481","https://openalex.org/W2148616436","https://openalex.org/W2102525122","https://openalex.org/W4245282135","https://openalex.org/W4306316843","https://openalex.org/W2130594209","https://openalex.org/W2036953450","https://openalex.org/W4300955944","https://openalex.org/W2170004886","https://openalex.org/W2527822502"],"abstract_inverted_index":{"In":[0],"this":[1],"work":[2],"we":[3,36],"propose":[4],"partial":[5],"task":[6],"replication":[7,24,40],"and":[8,54],"checkpointing":[9],"for":[10],"task-parallel":[11],"HPC":[12],"applications":[13],"to":[14,33,42],"mitigate":[15],"silent":[16],"data":[17],"corruption":[18],"(SDC)":[19],"errors.":[20],"As":[21],"the":[22],"complete":[23],"of":[25,58],"all":[26],"application":[27],"tasks":[28],"can":[29],"be":[30],"prohibitive":[31],"due":[32],"resource":[34],"costs,":[35],"introduce":[37],"programmer-directed":[38],"selective":[39],"mechanism":[41],"provide":[43],"fault-tolerance":[44],"while":[45],"decreasing":[46],"costs.":[47],"Results":[48],"show":[49],"that":[50],"our":[51],"scheme":[52],"detects":[53],"corrects":[55],"around":[56],"65%":[57],"SDC":[59],"errors":[60],"with":[61],"only":[62],"4%":[63],"overhead":[64],"on":[65],"average.":[66]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
