{"id":"https://openalex.org/W2912893741","doi":"https://doi.org/10.1109/tpds.2019.2898942","title":"PFP: Improving the Reliability of Deduplication-based Storage Systems with Per-File Parity","display_name":"PFP: Improving the Reliability of Deduplication-based Storage Systems with Per-File Parity","publication_year":2019,"publication_date":"2019-02-12","ids":{"openalex":"https://openalex.org/W2912893741","doi":"https://doi.org/10.1109/tpds.2019.2898942","mag":"2912893741"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2019.2898942","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2019.2898942","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100743604","display_name":"Suzhen Wu","orcid":"https://orcid.org/0000-0002-3589-9621"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Suzhen Wu","raw_affiliation_strings":["Computer Science Department, Xiamen University, Xiamen, Fujian, China"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Xiamen University, Xiamen, Fujian, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003486125","display_name":"Bo Mao","orcid":"https://orcid.org/0000-0002-4819-4583"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Mao","raw_affiliation_strings":["Software School, Xiamen University, Xiamen, Fujian, China"],"affiliations":[{"raw_affiliation_string":"Software School, Xiamen University, Xiamen, Fujian, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054285749","display_name":"Hong Jiang","orcid":"https://orcid.org/0000-0002-1477-9751"},"institutions":[{"id":"https://openalex.org/I189196454","display_name":"The University of Texas at Arlington","ror":"https://ror.org/019kgqr73","country_code":"US","type":"education","lineage":["https://openalex.org/I189196454"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hong Jiang","raw_affiliation_strings":["Computer Science and Engineering Department, University of Texas at Arlington, Arlington, TX, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Department, University of Texas at Arlington, Arlington, TX, USA","institution_ids":["https://openalex.org/I189196454"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082887535","display_name":"Huagao Luan","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huagao Luan","raw_affiliation_strings":["Computer Science Department, Xiamen University, Xiamen, Fujian, China"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Xiamen University, Xiamen, Fujian, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004740719","display_name":"Jindong Zhou","orcid":"https://orcid.org/0000-0001-7656-7722"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jindong Zhou","raw_affiliation_strings":["Software School, Xiamen University, Xiamen, Fujian, China"],"affiliations":[{"raw_affiliation_string":"Software School, Xiamen University, Xiamen, Fujian, China","institution_ids":["https://openalex.org/I191208505"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100743604"],"corresponding_institution_ids":["https://openalex.org/I191208505"],"apc_list":null,"apc_paid":null,"fwci":1.2379,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.80710241,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"30","issue":"9","first_page":"2117","last_page":"2129"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-deduplication","display_name":"Data deduplication","score":0.9208447933197021},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8710345029830933},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.6724755764007568},{"id":"https://openalex.org/keywords/chunking","display_name":"Chunking (psychology)","score":0.5746712684631348},{"id":"https://openalex.org/keywords/raid","display_name":"RAID","score":0.511347234249115},{"id":"https://openalex.org/keywords/computer-data-storage","display_name":"Computer data storage","score":0.4282572269439697},{"id":"https://openalex.org/keywords/file-system","display_name":"File system","score":0.4237516522407532},{"id":"https://openalex.org/keywords/data-redundancy","display_name":"Data redundancy","score":0.41888517141342163},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.4173800051212311},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3523138761520386},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.19772931933403015}],"concepts":[{"id":"https://openalex.org/C32587265","wikidata":"https://www.wikidata.org/wiki/Q1182260","display_name":"Data deduplication","level":2,"score":0.9208447933197021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8710345029830933},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.6724755764007568},{"id":"https://openalex.org/C203357204","wikidata":"https://www.wikidata.org/wiki/Q1089605","display_name":"Chunking (psychology)","level":2,"score":0.5746712684631348},{"id":"https://openalex.org/C133320665","wikidata":"https://www.wikidata.org/wiki/Q179299","display_name":"RAID","level":2,"score":0.511347234249115},{"id":"https://openalex.org/C194739806","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Computer data storage","level":2,"score":0.4282572269439697},{"id":"https://openalex.org/C2780940931","wikidata":"https://www.wikidata.org/wiki/Q174989","display_name":"File system","level":2,"score":0.4237516522407532},{"id":"https://openalex.org/C7545210","wikidata":"https://www.wikidata.org/wiki/Q838123","display_name":"Data redundancy","level":2,"score":0.41888517141342163},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.4173800051212311},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3523138761520386},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.19772931933403015},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2019.2898942","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2019.2898942","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2184068523","display_name":null,"funder_award_id":"U1705261","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3374635623","display_name":null,"funder_award_id":"CCF-1629625","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4387056415","display_name":null,"funder_award_id":"CCF-1704504","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G529135757","display_name":null,"funder_award_id":"61872305","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6708825637","display_name":null,"funder_award_id":"61472336","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8257308584","display_name":null,"funder_award_id":"61772439","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W6847055","https://openalex.org/W11345677","https://openalex.org/W22807665","https://openalex.org/W126194223","https://openalex.org/W182307532","https://openalex.org/W200233886","https://openalex.org/W1418704970","https://openalex.org/W1541467180","https://openalex.org/W1542686980","https://openalex.org/W1599186236","https://openalex.org/W1965572530","https://openalex.org/W1965751562","https://openalex.org/W1971212200","https://openalex.org/W1979162731","https://openalex.org/W1984731420","https://openalex.org/W1988161332","https://openalex.org/W1988596907","https://openalex.org/W1996496158","https://openalex.org/W2022636838","https://openalex.org/W2043719859","https://openalex.org/W2047439460","https://openalex.org/W2055899630","https://openalex.org/W2123438830","https://openalex.org/W2125165932","https://openalex.org/W2138872609","https://openalex.org/W2156468933","https://openalex.org/W2161234420","https://openalex.org/W2277915713","https://openalex.org/W2401572102","https://openalex.org/W2418682648","https://openalex.org/W2475932436","https://openalex.org/W2528460538","https://openalex.org/W2592873330","https://openalex.org/W2604501166","https://openalex.org/W2752311492","https://openalex.org/W2993345055","https://openalex.org/W6600453592","https://openalex.org/W6600884019","https://openalex.org/W6605053430","https://openalex.org/W6607453207","https://openalex.org/W6608138927","https://openalex.org/W6628219055","https://openalex.org/W6632555794","https://openalex.org/W6678803342","https://openalex.org/W6683682350","https://openalex.org/W6695128442","https://openalex.org/W6717023391","https://openalex.org/W6734566231","https://openalex.org/W6771325250"],"related_works":["https://openalex.org/W2540788271","https://openalex.org/W2077135008","https://openalex.org/W4378228047","https://openalex.org/W2297121304","https://openalex.org/W2528460538","https://openalex.org/W4312090360","https://openalex.org/W4297789611","https://openalex.org/W2378607723","https://openalex.org/W3141722062","https://openalex.org/W2912893741"],"abstract_inverted_index":{"Data":[0],"deduplication":[1],"weakens":[2],"the":[3,37,55,123,155,163,176,181,234,275],"reliability":[4,56,141,156,214],"of":[5,39,125,157,169,172,227,269],"storage":[6,60,159,277],"systems":[7,61],"since":[8],"by":[9,78,196,210],"design":[10],"it":[11],"removes":[12],"duplicate":[13],"data":[14,44,70,82,95,107,129,170,182,204,246,255],"chunks":[15,85,108,171,183,205],"common":[16],"to":[17,24,119,153,274],"different":[18],"files":[19,23,52,73,117,195],"and":[20,127,199,216,239,249],"forces":[21],"these":[22,100],"share":[25],"a":[26,40,146,200,224,259],"single":[27,41],"physical":[28],"date":[29],"chunk,":[30,33],"or":[31,90],"critical":[32,43,81],"after":[34,72,175],"deduplication.":[35],"Thus,":[36],"loss":[38],"such":[42,132],"chunk":[45,130,247,256],"can":[46,114,188],"potentially":[47],"render":[48],"all":[49,194],"referencing":[50],"(sharing)":[51],"unavailable.":[53],"However,":[54],"issue":[57],"in":[58,122,241],"deduplication-based":[59,158,276],"has":[62],"not":[63],"received":[64],"adequate":[65],"attention.":[66],"Existing":[67],"approaches":[68],"introduce":[69],"redundancy":[71,191,236],"have":[74],"been":[75],"deduplicated,":[76],"either":[77],"replication":[79],"on":[80,93,104,223],"chunks,":[83,96],"i.e.,":[84],"with":[86,206],"high":[87,207],"reference":[88,208],"count,":[89],"RAID":[91],"schemes":[92,101],"unique":[94,106],"which":[97],"means":[98],"that":[99,230,263],"are":[102,184],"based":[103,220],"individual":[105,111,116],"rather":[109],"than":[110],"files.":[112],"This":[113],"leave":[115],"vulnerable":[118],"losses,":[120],"particularly":[121],"presence":[124],"transient":[126],"unrecoverable":[128],"errors":[131],"as":[133],"latent":[134],"sector":[135],"errors.":[136],"To":[137],"address":[138],"this":[139,143],"file":[140,174,251],"issue,":[142],"paper":[144],"proposes":[145],"Per-File":[147],"Parity":[148],"(short":[149],"for":[150,193,203],"PFP)":[151],"scheme":[152],"improve":[154],"systems.":[160],"PFP":[161,187,228,231,264],"computes":[162],"XOR":[164],"parity":[165,167,190],"within":[166],"groups":[168],"each":[173],"chunking":[177],"process":[178],"but":[179],"before":[180],"deduplicated.":[185],"Therefore,":[186],"provide":[189],"protection":[192,202],"intra-file":[197],"recovery":[198],"higher-level":[201],"counts":[209],"inter-file":[211],"recovery.":[212],"Our":[213],"analysis":[215],"extensive":[217],"data-driven,":[218],"failure-injection":[219],"experiments":[221],"conducted":[222],"prototype":[225],"implementation":[226],"show":[229],"significantly":[232],"outperforms":[233],"existing":[235],"solutions,":[237],"DTR":[238],"RCR,":[240],"system":[242],"reliability,":[243],"tolerating":[244],"multiple":[245,254],"failures":[248],"guaranteeing":[250],"availability":[252],"upon":[253],"failures.":[257],"Moreover,":[258],"performance":[260,272],"evaluation":[261],"shows":[262],"only":[265],"incurs":[266],"an":[267],"average":[268],"5.7":[270],"percent":[271],"degradation":[273],"system.":[278]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
