{"id":"https://openalex.org/W2048784665","doi":"https://doi.org/10.1145/1183401.1183406","title":"Cooperative checkpointing","display_name":"Cooperative checkpointing","publication_year":2006,"publication_date":"2006-06-28","ids":{"openalex":"https://openalex.org/W2048784665","doi":"https://doi.org/10.1145/1183401.1183406","mag":"2048784665"},"language":"en","primary_location":{"id":"doi:10.1145/1183401.1183406","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1183401.1183406","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 20th annual international conference on Supercomputing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063869378","display_name":"Adam J. Oliner","orcid":null},"institutions":[{"id":"https://openalex.org/I1743320","display_name":"Palo Alto University","ror":"https://ror.org/04f812k67","country_code":"US","type":"education","lineage":["https://openalex.org/I1743320"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Adam J. Oliner","raw_affiliation_strings":["Stanford University, Palo Alto, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Palo Alto, CA","institution_ids":["https://openalex.org/I1743320","https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112072124","display_name":"Larry Rudolph","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I4210110987","display_name":"IIT@MIT","ror":"https://ror.org/01wp8zh54","country_code":"US","type":"facility","lineage":["https://openalex.org/I30771326","https://openalex.org/I4210110987"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Larry Rudolph","raw_affiliation_strings":["MIT, CSAIL, Cambridge, MA","MIT - CSAIL, Cambridge, MA#TAB#"],"affiliations":[{"raw_affiliation_string":"MIT, CSAIL, Cambridge, MA","institution_ids":["https://openalex.org/I4210110987"]},{"raw_affiliation_string":"MIT - CSAIL, Cambridge, MA#TAB#","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111949082","display_name":"Ramendra K. Sahoo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramendra K. Sahoo","raw_affiliation_strings":["IBM, T. J. Watson Research Center, Hawthorne, NY"],"affiliations":[{"raw_affiliation_string":"IBM, T. J. Watson Research Center, Hawthorne, NY","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5063869378"],"corresponding_institution_ids":["https://openalex.org/I1743320","https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":7.5447,"has_fulltext":false,"cited_by_count":68,"citation_normalized_percentile":{"value":0.97410658,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"14","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8385494947433472},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.7885355949401855},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.672542154788971},{"id":"https://openalex.org/keywords/fault-tolerance","display_name":"Fault tolerance","score":0.6724405288696289},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.624593198299408},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6027523279190063},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.5546348690986633},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.5186076164245605},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.43293461203575134},{"id":"https://openalex.org/keywords/job-scheduler","display_name":"Job scheduler","score":0.4131624102592468},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.41137826442718506},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.19613271951675415},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1235162615776062},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.11811041831970215},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.07740512490272522},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.060387223958969116}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8385494947433472},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.7885355949401855},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.672542154788971},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.6724405288696289},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.624593198299408},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6027523279190063},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.5546348690986633},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.5186076164245605},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.43293461203575134},{"id":"https://openalex.org/C111873713","wikidata":"https://www.wikidata.org/wiki/Q1641413","display_name":"Job scheduler","level":3,"score":0.4131624102592468},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.41137826442718506},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.19613271951675415},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1235162615776062},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.11811041831970215},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.07740512490272522},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.060387223958969116},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1183401.1183406","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1183401.1183406","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 20th annual international conference on Supercomputing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.6499999761581421}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W64370538","https://openalex.org/W159719520","https://openalex.org/W1496940124","https://openalex.org/W1862835629","https://openalex.org/W1911403303","https://openalex.org/W1971952282","https://openalex.org/W2015651973","https://openalex.org/W2017838136","https://openalex.org/W2028133900","https://openalex.org/W2033656974","https://openalex.org/W2041250459","https://openalex.org/W2051965855","https://openalex.org/W2053691501","https://openalex.org/W2072915890","https://openalex.org/W2096020561","https://openalex.org/W2108686966","https://openalex.org/W2108992399","https://openalex.org/W2113052966","https://openalex.org/W2119018856","https://openalex.org/W2143220335","https://openalex.org/W2158907675","https://openalex.org/W2159762968","https://openalex.org/W2164569036","https://openalex.org/W2165022815","https://openalex.org/W2197919473","https://openalex.org/W6643050054","https://openalex.org/W7055024897"],"related_works":["https://openalex.org/W2153096481","https://openalex.org/W2148616436","https://openalex.org/W2102525122","https://openalex.org/W4245282135","https://openalex.org/W4306316843","https://openalex.org/W2130594209","https://openalex.org/W2036953450","https://openalex.org/W4300955944","https://openalex.org/W2170004886","https://openalex.org/W2527822502"],"abstract_inverted_index":{"Cooperative":[0,83],"checkpointing":[1,61,77,84,94],"increases":[2],"the":[3,40,79,126],"performance":[4],"and":[5,37,44,54,96,108],"robustness":[6],"of":[7,42,72,91,118,128],"a":[8,69,116],"system":[9,24],"by":[10,14],"allowing":[11],"checkpoints":[12],"requested":[13],"applications":[15],"to":[16,31,65,81,100,122],"be":[17,26,35,86,98],"dynamically":[18],"skipped":[19],"at":[20],"runtime.":[21],"A":[22,47],"robust":[23],"must":[25,34],"more":[27],"than":[28],"merely":[29],"resilient":[30],"failures;":[32],"it":[33],"adaptable":[36],"flexible":[38],"in":[39],"face":[41],"new":[43],"evolving":[45],"challenges.":[46],"simulation-based":[48],"experimental":[49],"analysis":[50],"using":[51],"both":[52],"probabilistic":[53],"harvested":[55],"failure":[56,73],"distributions":[57,74],"reveals":[58],"that":[59,75],"cooperative":[60,123],"enables":[62],"an":[63],"application":[64],"make":[66],"progress":[67],"under":[68],"wide":[70],"variety":[71],"periodic":[76,129],"lacks":[78],"flexibility":[80],"handle.":[82],"can":[85],"easily":[87],"implemented":[88],"on":[89],"top":[90],"existing":[92],"application-initiated":[93],"mechanisms":[95],"may":[97],"used":[99],"enhance":[101],"other":[102],"reliability":[103],"techniques":[104],"like":[105],"QoS":[106],"guarantees":[107],"fault-aware":[109],"job":[110],"scheduling.":[111],"The":[112],"simulations":[113],"also":[114],"support":[115],"number":[117],"theoretical":[119],"predictions":[120],"related":[121],"checkpointing,":[124],"including":[125],"non-competitiveness":[127],"checkpointing.":[130]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":5},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":8}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
