{"id":"https://openalex.org/W7151307211","doi":"https://doi.org/10.1109/icmla66185.2025.00196","title":"HierTTF: Hierarchical Two-Stage Time-to-Failure Prediction for Datacenter SSDs Using Telemetry","display_name":"HierTTF: Hierarchical Two-Stage Time-to-Failure Prediction for Datacenter SSDs Using Telemetry","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7151307211","doi":"https://doi.org/10.1109/icmla66185.2025.00196"},"language":null,"primary_location":{"id":"doi:10.1109/icmla66185.2025.00196","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00196","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090527393","display_name":"Geunrok Oh","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Geunrok Oh","raw_affiliation_strings":["Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133092479","display_name":"Sohyun Han","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sohyun Han","raw_affiliation_strings":["Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133126228","display_name":"Kijong You","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kijong You","raw_affiliation_strings":["Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082923106","display_name":"Jongsung Na","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jongsung Na","raw_affiliation_strings":["Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133065678","display_name":"Kyungsik Song","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kyungsik Song","raw_affiliation_strings":["Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106525956","display_name":"Sejeong Jang","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sejeong Jang","raw_affiliation_strings":["Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Device Solution, Memory Business,Hwaseong,Republic of Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133078937","display_name":"Yuqi Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yuqi Zhang","raw_affiliation_strings":["Samsung Electronics,Samsung R&#x0026;D Institute China Xi&#x2019;an,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Samsung R&#x0026;D Institute China Xi&#x2019;an,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5133147659","display_name":"Haonan Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Haonan Luo","raw_affiliation_strings":["Samsung Electronics,Samsung R&#x0026;D Institute China Xi&#x2019;an,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics,Samsung R&#x0026;D Institute China Xi&#x2019;an,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I2250650973"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5090527393"],"corresponding_institution_ids":["https://openalex.org/I2250650973"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.78204628,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1285","last_page":"1290"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.0013000000035390258,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.0006000000284984708,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/telemetry","display_name":"Telemetry","score":0.4142000079154968},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3163999915122986},{"id":"https://openalex.org/keywords/data-transmission","display_name":"Data transmission","score":0.25450000166893005},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.2264000028371811}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5932000279426575},{"id":"https://openalex.org/C183121708","wikidata":"https://www.wikidata.org/wiki/Q209867","display_name":"Telemetry","level":2,"score":0.4142000079154968},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3734999895095825},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3163999915122986},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.2937000095844269},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.25450000166893005},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.24160000681877136},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2264000028371811},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.22509999573230743},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.2214999943971634}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmla66185.2025.00196","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00196","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1498436455","https://openalex.org/W2064675550","https://openalex.org/W2112796928","https://openalex.org/W2131774270","https://openalex.org/W2295598076","https://openalex.org/W2950635152","https://openalex.org/W2980994438","https://openalex.org/W3147894994","https://openalex.org/W4200191783","https://openalex.org/W4385245566","https://openalex.org/W4400762160"],"related_works":[],"abstract_inverted_index":{"Storage":[0],"reliability":[1,219],"is":[2],"mission-critical":[3],"in":[4,147,202,214,217],"cloud":[5],"and":[6,18,38,43,78,130,158,170,184,210,220],"data-center":[7],"environments,":[8],"yet":[9],"unexpected":[10],"storage":[11,28,54],"failures":[12],"still":[13],"cause":[14],"outages,":[15],"operational":[16,218],"overhead,":[17],"data":[19,204,208],"loss.":[20],"This":[21,66],"has":[22,199],"driven":[23],"ongoing":[24],"efforts":[25],"to":[26,31,75,104,121],"predict":[27,61],"failures,":[29],"leading":[30],"threshold-based":[32],"methods":[33,48],"that":[34],"use":[35],"self-monitoring,":[36],"analysis,":[37],"reporting":[39],"technology":[40],"(SMART)":[41],"statistics":[42],"binary":[44],"classifiers.":[45],"However,":[46],"these":[47],"can":[49],"only":[50],"indicate":[51],"whether":[52],"a":[53,88,98,117,176],"drive":[55,211],"may":[56],"fail,":[57],"but":[58],"do":[59],"not":[60],"when":[62],"failure":[63],"will":[64],"occur.":[65],"limitation":[67],"highlights":[68],"the":[69,122,126,192,195],"need":[70],"for":[71,92],"time-to-failure":[72],"(TTF)":[73],"forecasting":[74],"enable":[76],"proactive":[77,207],"risk-aware":[79],"maintenance.":[80],"To":[81],"overcome":[82],"this":[83],"limitation,":[84],"we":[85],"propose":[86],"HierTTF,":[87],"hierarchical":[89,196],"two-stage":[90],"framework":[91],"TTF":[93,128],"prediction.":[94],"Stage":[95,114,150,159],"1":[96,151],"uses":[97],"CNN-LSTM":[99],"classifier":[100],"with":[101,175],"multi-head":[102],"attention":[103],"screen":[105],"drives":[106],"at":[107,155],"risk":[108],"of":[109,194],"failing":[110],"within":[111],"14":[112],"days.":[113,173],"2":[115,160],"applies":[116],"DeepAR-based":[118],"probabilistic":[119],"forecaster":[120],"screened":[123],"cohort,":[124],"yielding":[125],"conditional":[127],"distribution":[129],"95%":[131],"prediction":[132],"intervals.":[133],"We":[134],"validate":[135],"HierTTF":[136,179,198],"on":[137],"more":[138],"than":[139],"5":[140],"million":[141],"enterprise":[142],"SSDs":[143],"over":[144],"28":[145],"months":[146],"real-world":[148,203],"datacenters.":[149],"attains":[152],"84.8%":[153],"precision":[154],"74.7%":[156],"recall,":[157],"achieves":[161],"MAE":[162,181],"0.918":[163],"days,":[164],"R<sup":[165,186],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[166,187],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[167,188],"=":[168],"0.928":[169],"CRPS":[171],"0.85":[172],"Compared":[174],"non-hierarchical":[177],"model,":[178],"cuts":[180],"by":[182,189],"76.7%":[183],"raises":[185],"0.556,":[190],"demonstrating":[191],"value":[193],"approach.":[197],"been":[200],"deployed":[201],"centers,":[205],"supporting":[206],"migration":[209],"replacement,":[212],"resulting":[213],"measurable":[215],"improvements":[216],"efficiency":[221]},"counts_by_year":[],"updated_date":"2026-04-09T06:08:40.794217","created_date":"2026-04-08T00:00:00"}
