{"id":"https://openalex.org/W4389628352","doi":"https://doi.org/10.1145/3626785","title":"HEAL: Performance Troubleshooting Deep inside Data Center Hosts","display_name":"HEAL: Performance Troubleshooting Deep inside Data Center Hosts","publication_year":2023,"publication_date":"2023-12-07","ids":{"openalex":"https://openalex.org/W4389628352","doi":"https://doi.org/10.1145/3626785"},"language":"en","primary_location":{"id":"doi:10.1145/3626785","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626785","pdf_url":null,"source":{"id":"https://openalex.org/S4210193547","display_name":"Proceedings of the ACM on Measurement and Analysis of Computing Systems","issn_l":"2476-1249","issn":["2476-1249"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Measurement and Analysis of Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037507957","display_name":"Yicheng Pan","orcid":"https://orcid.org/0000-0003-4139-1477"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yicheng Pan","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006129839","display_name":"Yang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang Zhang","raw_affiliation_strings":["ByteDance Inc., Beijing , China"],"affiliations":[{"raw_affiliation_string":"ByteDance Inc., Beijing , China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059295946","display_name":"Tingzhu Bi","orcid":"https://orcid.org/0000-0003-0366-0410"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingzhu Bi","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037621362","display_name":"Linlin Han","orcid":"https://orcid.org/0000-0002-4714-2634"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Linlin Han","raw_affiliation_strings":["ByteDance Inc., Beijing , China"],"affiliations":[{"raw_affiliation_string":"ByteDance Inc., Beijing , China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082859077","display_name":"Yu Zhang","orcid":"https://orcid.org/0000-0003-4334-5159"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu Zhang","raw_affiliation_strings":["ByteDance Inc., Beijing , China"],"affiliations":[{"raw_affiliation_string":"ByteDance Inc., Beijing , China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100762316","display_name":"Meng Ma","orcid":"https://orcid.org/0000-0002-1963-2513"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Ma","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045580175","display_name":"X. Y. Shen","orcid":"https://orcid.org/0009-0004-9321-4442"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiangzhuang Shen","raw_affiliation_strings":["ByteDance Inc., Beijing , China"],"affiliations":[{"raw_affiliation_string":"ByteDance Inc., Beijing , China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069364644","display_name":"Xinrui Jiang","orcid":"https://orcid.org/0000-0003-1591-0480"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinrui Jiang","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071877363","display_name":"Feng Wang","orcid":"https://orcid.org/0009-0001-3981-8163"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng Wang","raw_affiliation_strings":["ByteDance Inc., Beijing , China"],"affiliations":[{"raw_affiliation_string":"ByteDance Inc., Beijing , China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002345641","display_name":"Xian Liu","orcid":"https://orcid.org/0000-0002-7332-0449"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xian Liu","raw_affiliation_strings":["ByteDance Inc., Beijing , China"],"affiliations":[{"raw_affiliation_string":"ByteDance Inc., Beijing , China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100338689","display_name":"Ping Wang","orcid":"https://orcid.org/0000-0002-8854-2079"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Wang","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5037507957"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20734858,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"7","issue":"3","first_page":"1","last_page":"24"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.800966739654541},{"id":"https://openalex.org/keywords/host","display_name":"Host (biology)","score":0.7848528623580933},{"id":"https://openalex.org/keywords/troubleshooting","display_name":"Troubleshooting","score":0.7723817825317383},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.748253345489502},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.6201283931732178},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.5586733818054199},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4832923710346222},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4516604542732239},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.41397035121917725},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.40257835388183594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3269273042678833},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.10688415169715881}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.800966739654541},{"id":"https://openalex.org/C126831891","wikidata":"https://www.wikidata.org/wiki/Q221673","display_name":"Host (biology)","level":2,"score":0.7848528623580933},{"id":"https://openalex.org/C147494362","wikidata":"https://www.wikidata.org/wiki/Q2078905","display_name":"Troubleshooting","level":2,"score":0.7723817825317383},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.748253345489502},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.6201283931732178},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.5586733818054199},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4832923710346222},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4516604542732239},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.41397035121917725},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.40257835388183594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3269273042678833},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.10688415169715881},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3626785","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626785","pdf_url":null,"source":{"id":"https://openalex.org/S4210193547","display_name":"Proceedings of the ACM on Measurement and Analysis of Computing Systems","issn_l":"2476-1249","issn":["2476-1249"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Measurement and Analysis of Computing Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1833690888","display_name":null,"funder_award_id":"62072006","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2238413409","display_name":null,"funder_award_id":"62072006,92167104","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"},{"id":"https://openalex.org/G253385302","display_name":null,"funder_award_id":"92167104","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3011155338","display_name":null,"funder_award_id":"202102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4378010139","display_name":null,"funder_award_id":"201079","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6274316903","display_name":null,"funder_award_id":"2167104","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8375917964","display_name":null,"funder_award_id":"202102010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1967903840","https://openalex.org/W1975062332","https://openalex.org/W2028604378","https://openalex.org/W2085392455","https://openalex.org/W2110699951","https://openalex.org/W2123967542","https://openalex.org/W2161020850","https://openalex.org/W2167482691","https://openalex.org/W2181523240","https://openalex.org/W2322013807","https://openalex.org/W2563693940","https://openalex.org/W2770712100","https://openalex.org/W2821372324","https://openalex.org/W2884025810","https://openalex.org/W2903799441","https://openalex.org/W2954234386","https://openalex.org/W2965838158","https://openalex.org/W2966971704","https://openalex.org/W3006026125","https://openalex.org/W3022004659","https://openalex.org/W3080401329","https://openalex.org/W3149216967","https://openalex.org/W3155949183","https://openalex.org/W3170548061","https://openalex.org/W3194035167","https://openalex.org/W4251967167","https://openalex.org/W4290927880","https://openalex.org/W4318830451"],"related_works":["https://openalex.org/W3013479934","https://openalex.org/W4210597238","https://openalex.org/W4318325534","https://openalex.org/W4206476896","https://openalex.org/W4240398146","https://openalex.org/W2950310564","https://openalex.org/W4238338086","https://openalex.org/W2467308209","https://openalex.org/W2913357653","https://openalex.org/W1981753479"],"abstract_inverted_index":{"This":[0],"study":[1],"demonstrates":[2],"the":[3,33,51,55,65,69,93,146],"salient":[4],"facts":[5],"and":[6,41,54,99,114,142,158,162],"challenges":[7],"of":[8,22,95],"host":[9,17,34,77,89],"failure":[10,66],"operations":[11,161],"in":[12,86,130],"hyperscale":[13],"data":[14,156],"centers.":[15],"A":[16],"incident":[18],"can":[19,104],"involve":[20],"hundreds":[21],"distinct":[23],"host-level":[24],"metrics,":[25],"covering":[26],"broad":[27],"aspects.":[28],"The":[29],"faulting":[30],"mechanism":[31,67],"inside":[32,68],"connects":[35],"these":[36,59,118,150],"heterogeneous":[37,88],"metrics":[38,78,90],"through":[39],"direct":[40],"indirect":[42],"correlation,":[43],"making":[44],"it":[45],"extremely":[46],"difficult":[47],"to":[48,165],"sort":[49],"out":[50],"propagation":[52],"procedures":[53],"root":[56],"cause":[57],"from":[58,111],"intertwined":[60],"indicators.":[61],"To":[62],"deeply":[63],"understand":[64],"host,":[70],"we":[71],"develop":[72],"HEAL":[73,81,121,136,152],"--":[74],"a":[75],"novel":[76],"analysis":[79],"toolkit.":[80],"synergistically":[82],"discovers":[83],"dynamic":[84],"causality":[85],"sparse":[87],"by":[91],"combining":[92],"strengths":[94],"both":[96],"time":[97],"series":[98],"random":[100],"variable":[101],"analysis.":[102],"It":[103],"also":[105],"proactively":[106],"extract":[107],"causal":[108],"directional":[109],"hints":[110],"causality's":[112],"asymmetry":[113],"historical":[115],"knowledge.":[116],"Together,":[117],"breakthroughs":[119],"help":[120],"produce":[122],"accurate":[123],"results":[124],"given":[125],"undesirable":[126],"inputs.":[127],"Extensive":[128],"experiments":[129],"our":[131,155],"production":[132],"environment":[133],"verify":[134],"that":[135],"provides":[137],"significantly":[138],"better":[139],"result":[140],"accuracy":[141],"full-process":[143],"interpretability":[144],"than":[145],"SOTA":[147],"baselines.":[148],"With":[149],"advantages,":[151],"successfully":[153],"serves":[154],"center":[157],"worldwide":[159],"product":[160],"impressively":[163],"contributes":[164],"many":[166],"other":[167],"workflows.":[168]},"counts_by_year":[],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
