{"id":"https://openalex.org/W2908016640","doi":"https://doi.org/10.1109/pais.2018.8598484","title":"Fault Tolerance in Distributed Systems: A Survey","display_name":"Fault Tolerance in Distributed Systems: A Survey","publication_year":2018,"publication_date":"2018-10-01","ids":{"openalex":"https://openalex.org/W2908016640","doi":"https://doi.org/10.1109/pais.2018.8598484","mag":"2908016640"},"language":"en","primary_location":{"id":"doi:10.1109/pais.2018.8598484","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pais.2018.8598484","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 3rd International Conference on Pattern Analysis and Intelligent Systems (PAIS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000292833","display_name":"Abdeldjalil Ledmi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210095290","display_name":"Universit\u00e9 Larbi T\u00e9bessi","ror":"https://ror.org/00tnac320","country_code":"DZ","type":"education","lineage":["https://openalex.org/I4210095290"]}],"countries":["DZ"],"is_corresponding":false,"raw_author_name":"Abdeldjalil Ledmi","raw_affiliation_strings":["Laboratory of Mathematics, Informatics and Systems (LAMIS), University of Larbi, Tebessi, Tebessa, ALGERIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratory of Mathematics, Informatics and Systems (LAMIS), University of Larbi, Tebessi, Tebessa, ALGERIA","institution_ids":["https://openalex.org/I4210095290"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001584330","display_name":"Hakim Bendjenna","orcid":"https://orcid.org/0000-0003-0352-6617"},"institutions":[{"id":"https://openalex.org/I4210095290","display_name":"Universit\u00e9 Larbi T\u00e9bessi","ror":"https://ror.org/00tnac320","country_code":"DZ","type":"education","lineage":["https://openalex.org/I4210095290"]}],"countries":["DZ"],"is_corresponding":false,"raw_author_name":"Hakim Bendjenna","raw_affiliation_strings":["Laboratory of Mathematics, Informatics and Systems (LAMIS), University of Larbi, Tebessi, Tebessa, ALGERIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratory of Mathematics, Informatics and Systems (LAMIS), University of Larbi, Tebessi, Tebessa, ALGERIA","institution_ids":["https://openalex.org/I4210095290"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044478313","display_name":"Sofiane Mounine Hemam","orcid":"https://orcid.org/0000-0002-9638-8390"},"institutions":[{"id":"https://openalex.org/I4210130929","display_name":"Abb\u00e8s Laghrour University of Khenchela","ror":"https://ror.org/02yyskm09","country_code":"DZ","type":"education","lineage":["https://openalex.org/I4210130929"]}],"countries":["DZ"],"is_corresponding":false,"raw_author_name":"Sofiane Mounine Hemam","raw_affiliation_strings":["ICOSI Laaboratory, Khenchela University, Khenchela, Algeria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ICOSI Laaboratory, Khenchela University, Khenchela, Algeria","institution_ids":["https://openalex.org/I4210130929"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3835,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.84173179,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8034229278564453},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.7668255567550659},{"id":"https://openalex.org/keywords/fault-tolerance","display_name":"Fault tolerance","score":0.7284571528434753},{"id":"https://openalex.org/keywords/software-fault-tolerance","display_name":"Software fault tolerance","score":0.6814450621604919},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.5631940364837646},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.5478437542915344},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.47436532378196716},{"id":"https://openalex.org/keywords/grid-computing","display_name":"Grid computing","score":0.4378148317337036},{"id":"https://openalex.org/keywords/reliability-engineering","display_name":"Reliability engineering","score":0.35196447372436523},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.15966767072677612},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.13082167506217957},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11114296317100525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8034229278564453},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.7668255567550659},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.7284571528434753},{"id":"https://openalex.org/C50712370","wikidata":"https://www.wikidata.org/wiki/Q4269346","display_name":"Software fault tolerance","level":3,"score":0.6814450621604919},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.5631940364837646},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.5478437542915344},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.47436532378196716},{"id":"https://openalex.org/C70429105","wikidata":"https://www.wikidata.org/wiki/Q249999","display_name":"Grid computing","level":3,"score":0.4378148317337036},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.35196447372436523},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.15966767072677612},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.13082167506217957},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11114296317100525},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/pais.2018.8598484","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pais.2018.8598484","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 3rd International Conference on Pattern Analysis and Intelligent Systems (PAIS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.44999998807907104,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W21025594","https://openalex.org/W1488150418","https://openalex.org/W1493735863","https://openalex.org/W1508143344","https://openalex.org/W1555993967","https://openalex.org/W1848882129","https://openalex.org/W2039445823","https://openalex.org/W2049008806","https://openalex.org/W2064651666","https://openalex.org/W2092524537","https://openalex.org/W2118655063","https://openalex.org/W2119341411","https://openalex.org/W2171453084","https://openalex.org/W2786111694","https://openalex.org/W3014366097","https://openalex.org/W4231972924","https://openalex.org/W4323053766","https://openalex.org/W6629805146"],"related_works":["https://openalex.org/W1824707887","https://openalex.org/W2068583628","https://openalex.org/W169905258","https://openalex.org/W2013271762","https://openalex.org/W1570043218","https://openalex.org/W3146449452","https://openalex.org/W2162684709","https://openalex.org/W2147457882","https://openalex.org/W2115770466","https://openalex.org/W2111726532"],"abstract_inverted_index":{"Distributed":[0],"systems":[1,124,153],"can":[2,16],"be":[3],"homogeneous":[4],"(cluster),":[5],"or":[6,51],"heterogeneous":[7],"such":[8,23,154],"as":[9,24],"Grid,":[10],"Cloud":[11,159],"and":[12,33,62,104,125,145,160],"P2P.":[13],"Several":[14],"problems":[15],"occur":[17],"in":[18,55,66,72,83,132,149],"these":[19,87,99,107],"types":[20],"of":[21,26,45,86,98,118,122,152],"systems,":[22],"quality":[25],"service":[27],"(QoS),":[28],"resource":[29],"selection,":[30],"load":[31],"balancing":[32],"fault":[34],"tolerance.":[35],"Fault":[36],"tolerance":[37],"is":[38,101],"a":[39,49,60,69,133],"main":[40],"subject":[41],"regarding":[42],"the":[43,56,76,84,96,119,136],"design":[44],"distributed":[46,123],"systems.":[47,162],"When":[48],"hardware":[50],"software":[52],"failure":[53,61],"occurs":[54],"system,":[57],"it":[58],"causes":[59],"we":[63,112,130],"call":[64],"it,":[65],"this":[67,110],"case,":[68],"fault.":[70],"Moreover,":[71],"order":[73],"to":[74,78,102,105,143,146],"allow":[75],"system":[77],"continue":[79],"its":[80],"functionalities,":[81],"even":[82],"presence":[85],"faults,":[88],"they":[89],"must":[90],"find":[91],"techniques,":[92],"which":[93],"tolerate":[94,140],"failure;":[95],"goal":[97],"techniques":[100,138],"detect":[103],"correct":[106,147],"errors.":[108],"In":[109],"paper,":[111],"introduce":[113],"at":[114],"first":[115],"an":[116],"overview":[117],"basic":[120],"concepts":[121],"their":[126],"failures":[127],"types,":[128],"then":[129],"present,":[131],"detailed":[134],"manner,":[135],"different":[137,150],"that":[139],"fault,":[141],"used":[142],"identify":[144],"faults":[148],"kinds":[151],"as:":[155],"cluster,":[156],"grid":[157],"computing,":[158],"P2P":[161]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
