{"id":"https://openalex.org/W4408325077","doi":"https://doi.org/10.1109/globecom52923.2024.10901010","title":"Scalable Dynamic Resource Allocation via Domain Randomized Reinforcement Learning","display_name":"Scalable Dynamic Resource Allocation via Domain Randomized Reinforcement Learning","publication_year":2024,"publication_date":"2024-12-08","ids":{"openalex":"https://openalex.org/W4408325077","doi":"https://doi.org/10.1109/globecom52923.2024.10901010"},"language":"en","primary_location":{"id":"doi:10.1109/globecom52923.2024.10901010","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom52923.2024.10901010","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"GLOBECOM 2024 - 2024 IEEE Global Communications Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100731440","display_name":"Yiqi Wang","orcid":"https://orcid.org/0000-0002-9657-3617"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiqi Wang","raw_affiliation_strings":["Carnegie Mellon University,Electrical and Computer Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,Electrical and Computer Engineering","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075795654","display_name":"Laixi Shi","orcid":"https://orcid.org/0000-0003-4038-8620"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Laixi Shi","raw_affiliation_strings":["California Institute of Technology,Computing and Mathematical Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"California Institute of Technology,Computing and Mathematical Sciences","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051133896","display_name":"Martin Hyungwoo Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Martin Hyungwoo Lee","raw_affiliation_strings":["Carnegie Mellon University,Electrical and Computer Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,Electrical and Computer Engineering","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113534922","display_name":"Jaroslaw J. Sydir","orcid":"https://orcid.org/0009-0005-6493-7710"},"institutions":[{"id":"https://openalex.org/I4210158342","display_name":"Intel (United Kingdom)","ror":"https://ror.org/058cxws58","country_code":"GB","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210158342"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jaroslaw Sydir","raw_affiliation_strings":["Intel Labs Intel Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs Intel Corporation","institution_ids":["https://openalex.org/I4210158342"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100940923","display_name":"Zhou Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158342","display_name":"Intel (United Kingdom)","ror":"https://ror.org/058cxws58","country_code":"GB","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210158342"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhu Zhou","raw_affiliation_strings":["Intel Labs Intel Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs Intel Corporation","institution_ids":["https://openalex.org/I4210158342"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053809095","display_name":"Yuejie Chi","orcid":"https://orcid.org/0000-0002-6766-5459"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuejie Chi","raw_affiliation_strings":["Carnegie Mellon University,Electrical and Computer Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,Electrical and Computer Engineering","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100365126","display_name":"Bin Li","orcid":"https://orcid.org/0000-0001-8500-9917"},"institutions":[{"id":"https://openalex.org/I4210158342","display_name":"Intel (United Kingdom)","ror":"https://ror.org/058cxws58","country_code":"GB","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210158342"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Bin Li","raw_affiliation_strings":["Intel Labs Intel Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs Intel Corporation","institution_ids":["https://openalex.org/I4210158342"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.24196157,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2635","last_page":"2640"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.8105000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.8105000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.7932000160217285,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.7342000007629395,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8649391531944275},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7981365323066711},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7028185725212097},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.5915393829345703},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.486868292093277},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4499172568321228},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2782897353172302},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.15474796295166016},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.07099536061286926}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8649391531944275},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7981365323066711},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7028185725212097},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.5915393829345703},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.486868292093277},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4499172568321228},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2782897353172302},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.15474796295166016},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.07099536061286926},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/globecom52923.2024.10901010","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom52923.2024.10901010","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"GLOBECOM 2024 - 2024 IEEE Global Communications Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1603238809","https://openalex.org/W2151504984","https://openalex.org/W2760103357","https://openalex.org/W2769883686","https://openalex.org/W3049258101","https://openalex.org/W4214717370","https://openalex.org/W4324370128","https://openalex.org/W6637967152"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W1982914007","https://openalex.org/W2159583675","https://openalex.org/W1824242903","https://openalex.org/W1493858311","https://openalex.org/W2155470929","https://openalex.org/W2111125783","https://openalex.org/W2394465510","https://openalex.org/W2158842975"],"abstract_inverted_index":{"In":[0],"5G":[1],"wireless":[2],"networks,":[3],"the":[4,30,39,56,77,98,102,117,121,170,227],"User":[5],"Plane":[6],"Function":[7],"(UPF)":[8],"plays":[9],"a":[10,19,137,150,159,178],"crucial":[11],"role":[12],"in":[13,101,112],"efficiently":[14],"transferring":[15],"users\u2019":[16],"traffic":[17,53,107,114,123,132],"\u2014":[18,24],"series":[20],"of":[21,161],"data":[22,180],"packets":[23],"to":[25,46,75,124,157,210,226],"manage":[26],"internet":[27],"communications.":[28],"Setting":[29],"server\u2019s":[31],"processor":[32,58],"frequency":[33,59,172],"excessively":[34],"high":[35],"can":[36,115],"easily":[37],"meet":[38],"packet":[40,68,187],"drop":[41,69],"requirements":[42],"but":[43],"may":[44],"lead":[45],"unnecessary":[47],"power":[48,64,217],"consumption.":[49],"Therefore,":[50],"as":[51],"user":[52,113],"fluctuates,":[54],"selecting":[55],"optimal":[57,171],"is":[60],"essential":[61],"for":[62,206],"minimizing":[63],"consumption":[65,218],"while":[66],"satisfying":[67],"constraints.":[70],"This":[71,147],"challenge":[72],"motivates":[73],"us":[74],"address":[76,130],"dynamic":[78],"resource":[79,212],"(frequency)":[80],"allocation":[81,213],"problem,":[82],"where":[83],"deep":[84],"reinforcement":[85],"learning":[86],"(RL)":[87],"has":[88],"shown":[89],"significant":[90],"potential.":[91],"Most":[92],"existing":[93],"studies":[94],"train":[95],"and":[96,164,223],"evaluate":[97],"RL":[99,139],"model":[100],"same":[103],"environment":[104],"with":[105,142],"consistent":[106],"patterns.":[108],"However,":[109],"frequent":[110],"variations":[111],"cause":[116],"policy":[118,162,175],"trained":[119,198],"on":[120,127,189,199],"outdated":[122],"fail":[125],"catastrophically":[126],"unseen":[128,191],"traffic.To":[129],"such":[131],"distribution":[133],"shifts,":[134],"we":[135],"propose":[136],"two-phase":[138],"approach":[140],"augmented":[141],"Automatic":[143],"Domain":[144],"Randomization":[145],"(RL-ADR).":[146],"method":[148],"includes":[149],"training":[151],"phase":[152,167],"that":[153,168,203],"utilizes":[154],"domain":[155],"randomization":[156],"create":[158],"library":[160,176],"candidates,":[163],"an":[165],"inference":[166],"selects":[169],"using":[173],"this":[174],"alongside":[177],"safe":[179],"buffer.":[181],"The":[182],"proposed":[183],"RL-ADR":[184,215],"achieves":[185],"zero":[186],"drops":[188],"two":[190],"long-horizon":[192],"traffics":[193,202],"(3":[194],"hours)":[195],"after":[196],"being":[197],"25":[200],"synthetic":[201],"only":[204],"span":[205],"18":[207],"seconds.":[208],"Compared":[209],"static":[211],"baselines,":[214],"reduces":[216],"by":[219],"at":[220],"least":[221],"14.5%":[222],"performs":[224],"comparably":[225],"oracle":[228],"solution.":[229]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
