{"id":"https://openalex.org/W4404385652","doi":"https://doi.org/10.1145/3698038.3698507","title":"H2C-Dedup: Reducing I/O and GC Amplification for QLC SSDs from the Deduplication Metadata Perspective","display_name":"H2C-Dedup: Reducing I/O and GC Amplification for QLC SSDs from the Deduplication Metadata Perspective","publication_year":2024,"publication_date":"2024-11-14","ids":{"openalex":"https://openalex.org/W4404385652","doi":"https://doi.org/10.1145/3698038.3698507"},"language":"en","primary_location":{"id":"doi:10.1145/3698038.3698507","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3698038.3698507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Symposium on Cloud Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103401276","display_name":"Yunsheng Dong","orcid":"https://orcid.org/0009-0000-5004-013X"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunsheng Dong","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024962616","display_name":"Bo-Sheng Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Boju Chen","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059296415","display_name":"Yanqi Pan","orcid":"https://orcid.org/0009-0007-7832-0599"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanqi Pan","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021153181","display_name":"Xiangyu Zou","orcid":"https://orcid.org/0000-0001-5104-8301"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangyu Zou","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050928208","display_name":"Wen Xia","orcid":"https://orcid.org/0000-0003-4093-6391"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Xia","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Peng Cheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793","https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103401276"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":0.698,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.73523456,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"704","last_page":"719"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.9550999999046326,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-deduplication","display_name":"Data deduplication","score":0.9106829166412354},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.8734408020973206},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.7695001363754272},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.689023494720459},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3904915153980255},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3296715319156647},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.09358289837837219}],"concepts":[{"id":"https://openalex.org/C32587265","wikidata":"https://www.wikidata.org/wiki/Q1182260","display_name":"Data deduplication","level":2,"score":0.9106829166412354},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.8734408020973206},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.7695001363754272},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.689023494720459},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3904915153980255},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3296715319156647},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.09358289837837219}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3698038.3698507","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3698038.3698507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Symposium on Cloud Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W178328500","https://openalex.org/W1967106146","https://openalex.org/W2029118431","https://openalex.org/W2126116376","https://openalex.org/W2129610259","https://openalex.org/W2147407897","https://openalex.org/W2169711736","https://openalex.org/W2221799239","https://openalex.org/W2289555345","https://openalex.org/W2475932436","https://openalex.org/W2492590231","https://openalex.org/W2901347649","https://openalex.org/W2916086000","https://openalex.org/W2951313701","https://openalex.org/W2962814013","https://openalex.org/W2964142687","https://openalex.org/W2986445348","https://openalex.org/W3008170349","https://openalex.org/W3098486933","https://openalex.org/W3178257743","https://openalex.org/W4312543403","https://openalex.org/W4312554896","https://openalex.org/W4312996182","https://openalex.org/W4327710063","https://openalex.org/W4387321103","https://openalex.org/W4389166743"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3144870715","https://openalex.org/W3142319788","https://openalex.org/W2587188779","https://openalex.org/W3132870970","https://openalex.org/W4385804830","https://openalex.org/W2943088381","https://openalex.org/W2074021203","https://openalex.org/W2144348063"],"abstract_inverted_index":{"QLC":[0,41],"SSDs":[1],"have":[2],"gained":[3],"increasing":[4],"popularity":[5],"in":[6],"cloud":[7],"computing,":[8],"PCs,":[9],"and":[10,17,83,88,173,188,208,225,237,243,250],"smartphones":[11],"due":[12,70,95],"to":[13,39,71,96,123,150,158,169,176,184,233,248],"their":[14],"low":[15],"prices":[16],"high":[18],"density,":[19],"but":[20],"they":[21,196],"suffer":[22],"from":[23,64],"extremely":[24],"limited":[25],"endurance.":[26],"Deduplication":[27],"can":[28,231],"convert":[29],"redundant":[30,102],"chunk":[31],"writes":[32],"into":[33,166],"fine-grained":[34],"metadata":[35,85,98,132,140,165,190],"updates,":[36],"thereby":[37],"promising":[38],"alleviate":[40],"wear.":[42],"Nevertheless,":[43],"our":[44],"observation":[45],"shows":[46],"that":[47,60,137,229],"existing":[48],"deduplication":[49,84,97,139],"approaches":[50],"cause":[51],"even":[52],"more":[53],"I/Os":[54],"than":[55],"non-deduplication":[56],"systems.":[57],"We":[58,211],"find":[59],"the":[61,72,110,138,153,181,205,220],"amplification":[62,69,94],"comes":[63],"two":[65,119],"sources:":[66],"(1)":[67],"I/O":[68,77,86,125,133,148,155,207,245],"mismatched":[73],"granularity":[74],"between":[75],"SSD":[76,90],"size":[78],"(e.g.,":[79,168,175],"4--16":[80],"KiB":[81],"page)":[82],"size,":[87],"(2)":[89],"garbage":[91],"collection":[92],"(GC)":[93],"updates":[99],"for":[100],"eliminating":[101],"chunks":[103],"(i.e.,":[104],"increment":[105],"reference":[106,171],"count).":[107],"To":[108],"address":[109,124,159],"above":[111],"problem,":[112],"this":[113],"paper":[114],"proposes":[115],"H2C-Dedup,":[116],"which":[117,135],"employs":[118],"essential":[120],"techniques.":[121],"First,":[122],"amplification,":[126,161],"cold2hot-heating":[127],"technique":[128,163],"utilizes":[129],"a":[130,200],"log-structured":[131],"scheme,":[134],"ensures":[136],"is":[141,145],"flushed":[142],"until":[143],"it":[144],"accumulated":[146],"within":[147],"cache":[149],"match":[151],"with":[152],"OS":[154],"granularity.":[156],"Second,":[157],"GC":[160,209],"hot2cold-suppression":[162],"divides":[164],"hot":[167,182,187],"store":[170,177],"count)":[172],"cold":[174,189],"fingerprint)":[178],"segments,":[179],"delta-encoding":[180],"entries":[183],"ensure":[185],"both":[186],"will":[191],"not":[192],"be":[193],"modified":[194],"once":[195],"are":[197],"durable.":[198],"As":[199],"result,":[201],"H2C-Dedup":[202,213,230],"significantly":[203],"reduces":[204],"deduplication-induced":[206],"amplification.":[210],"implement":[212],"based":[214],"on":[215,219],"F2FS.":[216],"Extensive":[217],"experiments":[218],"FEMU":[221],"platform":[222],"using":[223],"microbenchmarks":[224],"real-world":[226],"traces":[227],"indicate":[228],"extend":[232],"at":[234],"most":[235],"3.3\u00d7":[236],"3.4\u00d7":[238],"lifespan":[239],"while":[240],"accelerating":[241],"26%":[242],"37%":[244],"performance":[246],"compared":[247],"SmartDedup":[249],"HF-Dedupe.":[251]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
