{"id":"https://openalex.org/W7155542296","doi":"https://doi.org/10.1145/3767295.3803614","title":"Proactive Change Risk Detection in Production Cloud Systems: ByteDance\u2019s Experience","display_name":"Proactive Change Risk Detection in Production Cloud Systems: ByteDance\u2019s Experience","publication_year":2026,"publication_date":"2026-04-24","ids":{"openalex":"https://openalex.org/W7155542296","doi":"https://doi.org/10.1145/3767295.3803614"},"language":null,"primary_location":{"id":"doi:10.1145/3767295.3803614","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3767295.3803614","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 21st European Conference on Computer Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3767295.3803614","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134490163","display_name":"Jinyang Liu","orcid":"https://orcid.org/0000-0003-0037-1912"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jinyang Liu","raw_affiliation_strings":["ByteDance, San Jose, USA"],"raw_orcid":"https://orcid.org/0000-0003-0037-1912","affiliations":[{"raw_affiliation_string":"ByteDance, San Jose, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100426730","display_name":"Yichen Li","orcid":"https://orcid.org/0009-0009-8370-644X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yichen Li","raw_affiliation_strings":["ByteDance, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0009-8370-644X","affiliations":[{"raw_affiliation_string":"ByteDance, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134501412","display_name":"Tieying Zhang","orcid":"https://orcid.org/0009-0003-2250-5528"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tieying Zhang","raw_affiliation_strings":["ByteDance, San Jose, USA"],"raw_orcid":"https://orcid.org/0009-0003-2250-5528","affiliations":[{"raw_affiliation_string":"ByteDance, San Jose, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100687673","display_name":"Binbin Chen","orcid":"https://orcid.org/0000-0002-9584-0082"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Binbin Chen","raw_affiliation_strings":["ByteDance, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8598-2442","affiliations":[{"raw_affiliation_string":"ByteDance, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101661867","display_name":"Xiao He","orcid":"https://orcid.org/0000-0001-7959-2157"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao He","raw_affiliation_strings":["ByteDance, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-7959-2157","affiliations":[{"raw_affiliation_string":"ByteDance, Hangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068670072","display_name":"Zhihan Jiang","orcid":"https://orcid.org/0009-0003-1988-6219"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhihan Jiang","raw_affiliation_strings":["ByteDance, San Jose, USA"],"raw_orcid":"https://orcid.org/0009-0003-1988-6219","affiliations":[{"raw_affiliation_string":"ByteDance, San Jose, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100758732","display_name":"Haipeng Zhang","orcid":"https://orcid.org/0000-0001-5741-2311"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haipeng Zhang","raw_affiliation_strings":["ByteDance, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0009-4153-984X","affiliations":[{"raw_affiliation_string":"ByteDance, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134515930","display_name":"Gang Wu","orcid":"https://orcid.org/0009-0004-4048-7949"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gang Wu","raw_affiliation_strings":["ByteDance, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0004-4048-7949","affiliations":[{"raw_affiliation_string":"ByteDance, Shanghai, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5134532355","display_name":"Yi Li","orcid":"https://orcid.org/0009-0004-3069-9948"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi Li","raw_affiliation_strings":["ByteDance, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-3069-9948","affiliations":[{"raw_affiliation_string":"ByteDance, Beijing, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5134490163"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.95170725,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1565","last_page":"1580"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.13249999284744263,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.13249999284744263,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13181","display_name":"Economic and Technological Systems Analysis","score":0.05040000006556511,"subfield":{"id":"https://openalex.org/subfields/1405","display_name":"Management of Technology and Innovation"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11864","display_name":"Supply Chain Resilience and Risk Management","score":0.03709999844431877,"subfield":{"id":"https://openalex.org/subfields/1408","display_name":"Strategy and Management"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.5273000001907349},{"id":"https://openalex.org/keywords/production","display_name":"Production (economics)","score":0.5013999938964844},{"id":"https://openalex.org/keywords/change-detection","display_name":"Change detection","score":0.31029999256134033},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.28139999508857727},{"id":"https://openalex.org/keywords/risk-management","display_name":"Risk management","score":0.27390000224113464}],"concepts":[{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.5273000001907349},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.5013999938964844},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4681999981403351},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.40720000863075256},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.36059999465942383},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.33719998598098755},{"id":"https://openalex.org/C203595873","wikidata":"https://www.wikidata.org/wiki/Q25389927","display_name":"Change detection","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3767295.3803614","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3767295.3803614","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 21st European Conference on Computer Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3767295.3803614","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3767295.3803614","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 21st European Conference on Computer Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.5524477362632751}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W2601243251","https://openalex.org/W3003663372"],"related_works":[],"abstract_inverted_index":{"Modern":[0],"cloud":[1,46],"services":[2],"rely":[3],"on":[4],"a":[5,17,51,93,106,125,141,170],"high":[6],"volume":[7,70],"of":[8,20,44,63,71,161,163],"changes":[9,15,58,73],"for":[10,154],"rapid":[11],"innovation,":[12],"yet":[13],"these":[14],"are":[16],"primary":[18],"cause":[19],"production":[21,152,175],"incidents.":[22,182],"To":[23,87],"manage":[24],"this":[25,79,136],"risk,":[26],"industry":[27],"practice":[28],"employs":[29],"tiered":[30],"change":[31,100,127,142,164],"management":[32],"pipelines":[33],"that":[34,74,97],"concentrate":[35],"static":[36],"rules":[37],"and":[38,119,177],"human":[39],"reviews.":[40],"However,":[41],"our":[42],"analysis":[43],"ByteDance's":[45],"platform":[47],"(Volcano":[48],"Engine)":[49],"reveals":[50],"critical":[52],"long":[53],"tail":[54],"problem:":[55],"while":[56],"high-risk":[57],"undergo":[59],"extensive":[60],"scrutiny,":[61],"78.1%":[62],"change-induced":[64],"incidents":[65],"originate":[66],"from":[67,109,174],"the":[68],"sheer":[69],"low-risk":[72],"receive":[75],"minimal":[76],"review.":[77],"At":[78],"scale,":[80],"exhaustive":[81],"manual":[82],"review":[83],"is":[84,128,143],"fundamentally":[85],"infeasible.":[86],"address":[88],"this,":[89],"we":[90],"present":[91],"Aegis,":[92],"novel":[94],"knowledge-driven":[95],"system":[96],"provides":[98],"interpretable":[99],"risk":[101,117,167],"assessment.":[102],"Aegis":[103,130,148],"automatically":[104],"constructs":[105],"knowledge":[107],"base":[108],"historical":[110,137],"operational":[111],"data,":[112],"distilling":[113],"it":[114,158],"into":[115],"generalized":[116],"heuristics":[118],"identifying":[120],"relevant":[121],"precedent":[122],"cases.":[123],"When":[124],"new":[126],"proposed,":[129],"generates":[131],"human-readable":[132],"warnings":[133],"grounded":[134],"in":[135,149],"evidence,":[138],"explaining":[139],"why":[140],"risky.":[144],"We":[145],"have":[146],"deployed":[147],"Volcano":[150],"Engine's":[151],"environment":[153],"five":[155],"months,":[156],"where":[157],"processed":[159],"tens":[160],"thousands":[162],"requests.":[165],"Its":[166],"escalations":[168],"achieved":[169],"75%":[171],"acceptance":[172],"rate":[173],"engineers":[176],"successfully":[178],"prevented":[179],"multiple":[180],"potential":[181]},"counts_by_year":[],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2026-04-25T00:00:00"}
