{"id":"https://openalex.org/W7139130221","doi":"https://doi.org/10.1109/tpds.2026.3674891","title":"Scalable and Efficient Reinforcement Learning for Virtual Machine Rescheduling in Cloud Data Centers","display_name":"Scalable and Efficient Reinforcement Learning for Virtual Machine Rescheduling in Cloud Data Centers","publication_year":2026,"publication_date":"2026-03-18","ids":{"openalex":"https://openalex.org/W7139130221","doi":"https://doi.org/10.1109/tpds.2026.3674891"},"language":null,"primary_location":{"id":"doi:10.1109/tpds.2026.3674891","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2026.3674891","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108940900","display_name":"Xianzhong Ding","orcid":null},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xianzhong Ding","raw_affiliation_strings":["Lawrence Berkeley National Laboratory, Berkeley, CA, USA"],"raw_orcid":"https://orcid.org/0000-0001-6114-2801","affiliations":[{"raw_affiliation_string":"Lawrence Berkeley National Laboratory, Berkeley, CA, USA","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130019969","display_name":"Yunkai Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yunkai Zhang","raw_affiliation_strings":["University of California, Berkeley, Berkeley, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-7203-2883","affiliations":[{"raw_affiliation_string":"University of California, Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074940669","display_name":"Binbin Chen","orcid":"https://orcid.org/0000-0002-7760-3120"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Binbin Chen","raw_affiliation_strings":["ByteDance, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ByteDance, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065161741","display_name":"Donghao Ying","orcid":"https://orcid.org/0009-0001-7329-5917"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Donghao Ying","raw_affiliation_strings":["University of California, Berkeley, Berkeley, CA, USA"],"raw_orcid":"https://orcid.org/0009-0001-7329-5917","affiliations":[{"raw_affiliation_string":"University of California, Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129935715","display_name":"Tieying Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tieying Zhang","raw_affiliation_strings":["ByteDance, San Jose, CA, USA"],"raw_orcid":"https://orcid.org/0009-0003-2250-5528","affiliations":[{"raw_affiliation_string":"ByteDance, San Jose, CA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130106669","display_name":"Jianjun Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianjun Chen","raw_affiliation_strings":["ByteDance, San Jose, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ByteDance, San Jose, CA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083446090","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0001-7569-2118"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["ByteDance, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ByteDance, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044884862","display_name":"Alberto Cerpa","orcid":"https://orcid.org/0000-0003-4531-9704"},"institutions":[{"id":"https://openalex.org/I156087764","display_name":"University of California, Merced","ror":"https://ror.org/00d9ah105","country_code":"US","type":"education","lineage":["https://openalex.org/I156087764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alberto Cerpa","raw_affiliation_strings":["University of California, Merced, Merced, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-4531-9704","affiliations":[{"raw_affiliation_string":"University of California, Merced, Merced, CA, USA","institution_ids":["https://openalex.org/I156087764"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5130120933","display_name":"Wan Du","orcid":null},"institutions":[{"id":"https://openalex.org/I156087764","display_name":"University of California, Merced","ror":"https://ror.org/00d9ah105","country_code":"US","type":"education","lineage":["https://openalex.org/I156087764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wan Du","raw_affiliation_strings":["University of California, Merced, Merced, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-2057-2885","affiliations":[{"raw_affiliation_string":"University of California, Merced, Merced, CA, USA","institution_ids":["https://openalex.org/I156087764"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5108940900"],"corresponding_institution_ids":["https://openalex.org/I148283060"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.61767291,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"37","issue":"5","first_page":"1186","last_page":"1204"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.927299976348877,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.927299976348877,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.019300000742077827,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.014100000262260437,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7580000162124634},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.724399983882904},{"id":"https://openalex.org/keywords/virtual-machine","display_name":"Virtual machine","score":0.6953999996185303},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.6912999749183655},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5449000000953674},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.45190000534057617},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4235000014305115},{"id":"https://openalex.org/keywords/data-center","display_name":"Data center","score":0.42309999465942383},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41359999775886536}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8920000195503235},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7580000162124634},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.724399983882904},{"id":"https://openalex.org/C25344961","wikidata":"https://www.wikidata.org/wiki/Q192726","display_name":"Virtual machine","level":2,"score":0.6953999996185303},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.6912999749183655},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.6499000191688538},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5449000000953674},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.45190000534057617},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4235000014305115},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.42309999465942383},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41359999775886536},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4016000032424927},{"id":"https://openalex.org/C2778710394","wikidata":"https://www.wikidata.org/wiki/Q4179813","display_name":"Live migration","level":4,"score":0.3880000114440918},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.37220001220703125},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.3499999940395355},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.3465000092983246},{"id":"https://openalex.org/C513985346","wikidata":"https://www.wikidata.org/wiki/Q270471","display_name":"Virtualization","level":3,"score":0.32659998536109924},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.29409998655319214},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2639999985694885},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.2624000012874603},{"id":"https://openalex.org/C191015642","wikidata":"https://www.wikidata.org/wiki/Q1132459","display_name":"Fragmentation (computing)","level":2,"score":0.2513999938964844},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2026.3674891","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2026.3674891","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Managing":[0],"a":[1,10,98,113,122,134,154,174],"vast":[2],"number":[3],"of":[4,23,65,176],"virtual":[5],"machines":[6,31],"(VMs)":[7],"efficiently":[8],"is":[9,56,68],"critical":[11,128],"challenge":[12,55],"in":[13,50],"modern":[14],"large-scale":[15],"data":[16,152,156],"centers.":[17],"The":[18],"continuous":[19],"creation":[20],"and":[21,133,145,187],"termination":[22],"VMs":[24],"lead":[25],"to":[26,37,117,141,173,184],"resource":[27,39],"fragmentation":[28],"across":[29],"physical":[30],"(PMs),":[32],"necessitating":[33],"periodic":[34],"VM":[35,44,75,104],"rescheduling":[36,45,66,146],"optimize":[38],"utilization.":[40],"Despite":[41],"its":[42],"significance,":[43],"has":[46],"received":[47],"limited":[48],"attention":[49],"the":[51,63],"literature.":[52],"A":[53],"key":[54],"that,":[57],"unlike":[58],"conventional":[59],"combinatorial":[60],"optimization":[61],"problems,":[62],"efficiency":[64],"algorithms":[67],"heavily":[69],"impacted":[70],"by":[71],"inference":[72,171],"time,":[73],"as":[74],"states":[76],"evolve":[77],"dynamically":[78],"during":[79],"execution.":[80],"This":[81],"scalability":[82],"bottleneck":[83],"hampers":[84],"existing":[85],"methods.":[86],"To":[87,178],"address":[88],"this,":[89],"we":[90,181],"propose":[91],"VMR":[92,106,160],"<inline-formula":[93,107,161],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[94,108,162],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[95,109,163],"notation=\"LaTeX\">$^{2}$</tex-math></inline-formula>":[96,110,164],"L,":[97],"reinforcement":[99],"learning":[100],"framework":[101],"tailored":[102],"for":[103,131],"rescheduling.":[105],"L":[111,165],"integrates":[112],"two-stage":[114],"decision-making":[115],"process":[116],"accommodate":[118],"complex":[119],"operational":[120],"constraints,":[121],"feature":[123],"extraction":[124],"mechanism":[125],"that":[126,138,159],"captures":[127],"relational":[129],"information":[130],"rescheduling,":[132],"risk-aware":[135],"evaluation":[136],"strategy":[137],"enables":[139],"users":[140],"balance":[142],"execution":[143],"speed":[144],"accuracy.":[147],"Extensive":[148],"experiments":[149],"using":[150],"real-world":[151],"from":[153],"production-scale":[155],"center":[157],"demonstrate":[158],"achieves":[166],"near-optimal":[167],"performance":[168],"while":[169],"reducing":[170],"time":[172],"matter":[175],"seconds.":[177],"facilitate":[179],"reproducibility,":[180],"provide":[182],"access":[183],"our":[185],"implementation":[186],"datasets.":[188]},"counts_by_year":[],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2026-03-20T00:00:00"}
