{"id":"https://openalex.org/W4384161787","doi":"https://doi.org/10.1109/tgcn.2023.3295341","title":"Toward Scalable and Efficient Hierarchical Deep Reinforcement Learning for 5G RAN Slicing","display_name":"Toward Scalable and Efficient Hierarchical Deep Reinforcement Learning for 5G RAN Slicing","publication_year":2023,"publication_date":"2023-07-13","ids":{"openalex":"https://openalex.org/W4384161787","doi":"https://doi.org/10.1109/tgcn.2023.3295341"},"language":"en","primary_location":{"id":"doi:10.1109/tgcn.2023.3295341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgcn.2023.3295341","pdf_url":null,"source":{"id":"https://openalex.org/S4210192662","display_name":"IEEE Transactions on Green Communications and Networking","issn_l":"2473-2400","issn":["2473-2400"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Green Communications and Networking","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040803715","display_name":"Renlang Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Renlang Huang","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024793874","display_name":"Miao Guo","orcid":"https://orcid.org/0000-0002-7940-5590"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Miao Guo","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074511454","display_name":"Chaojie Gu","orcid":"https://orcid.org/0000-0003-2153-811X"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaojie Gu","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068195118","display_name":"Shibo He","orcid":"https://orcid.org/0000-0002-1505-6766"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shibo He","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4391767838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100726041","display_name":"Jiming Chen","orcid":"https://orcid.org/0000-0003-3155-3145"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiming Chen","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4391767838"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079378336","display_name":"Mingyang Sun","orcid":"https://orcid.org/0000-0002-5790-5025"},"institutions":[{"id":"https://openalex.org/I4391767838","display_name":"State Key Laboratory of Industrial Control Technology","ror":"https://ror.org/03a33a786","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767838","https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyang Sun","raw_affiliation_strings":["State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Industrial Control Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4391767838"]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5040803715"],"corresponding_institution_ids":["https://openalex.org/I4391767838"],"apc_list":null,"apc_paid":null,"fwci":2.3865,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.89263165,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"7","issue":"4","first_page":"2153","last_page":"2162"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13731","display_name":"Advanced Computing and Algorithms","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/3322","display_name":"Urban Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8431919813156128},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7667170763015747},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7297543287277222},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.645164430141449},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.6010034680366516},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.520774781703949},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.47854381799697876},{"id":"https://openalex.org/keywords/slicing","display_name":"Slicing","score":0.47590288519859314},{"id":"https://openalex.org/keywords/heterogeneous-network","display_name":"Heterogeneous network","score":0.4459804892539978},{"id":"https://openalex.org/keywords/resource-management","display_name":"Resource management (computing)","score":0.42279040813446045},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.4016577899456024},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3343610167503357},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.1673101782798767},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.08548399806022644},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.07873240113258362}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8431919813156128},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7667170763015747},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7297543287277222},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.645164430141449},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.6010034680366516},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.520774781703949},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.47854381799697876},{"id":"https://openalex.org/C2776190703","wikidata":"https://www.wikidata.org/wiki/Q488148","display_name":"Slicing","level":2,"score":0.47590288519859314},{"id":"https://openalex.org/C158207573","wikidata":"https://www.wikidata.org/wiki/Q5747224","display_name":"Heterogeneous network","level":4,"score":0.4459804892539978},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.42279040813446045},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.4016577899456024},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3343610167503357},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.1673101782798767},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.08548399806022644},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.07873240113258362},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tgcn.2023.3295341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgcn.2023.3295341","pdf_url":null,"source":{"id":"https://openalex.org/S4210192662","display_name":"IEEE Transactions on Green Communications and Networking","issn_l":"2473-2400","issn":["2473-2400"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Green Communications and Networking","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5600000023841858,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[{"id":"https://openalex.org/G2575069074","display_name":null,"funder_award_id":"62088101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3654453020","display_name":null,"funder_award_id":"2020YFB1708700","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G673267744","display_name":null,"funder_award_id":"226-2023-00111","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G6825229344","display_name":null,"funder_award_id":"226-2022-00107","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G8022898299","display_name":null,"funder_award_id":"U1909207","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W2133479744","https://openalex.org/W2145339207","https://openalex.org/W2147524058","https://openalex.org/W2615459164","https://openalex.org/W2736601468","https://openalex.org/W2744628735","https://openalex.org/W2746553466","https://openalex.org/W2788005034","https://openalex.org/W2963864421","https://openalex.org/W2968986602","https://openalex.org/W2989178978","https://openalex.org/W3002189898","https://openalex.org/W3023243578","https://openalex.org/W3039941973","https://openalex.org/W3049282540","https://openalex.org/W3091704528","https://openalex.org/W3110381504","https://openalex.org/W3115726903","https://openalex.org/W3123346421","https://openalex.org/W3170397984","https://openalex.org/W3176770340","https://openalex.org/W3201276757","https://openalex.org/W3216833280","https://openalex.org/W4206028292","https://openalex.org/W4206957298","https://openalex.org/W4210291334","https://openalex.org/W4292862193","https://openalex.org/W6638018090","https://openalex.org/W6683204974","https://openalex.org/W6684921986","https://openalex.org/W6685444567","https://openalex.org/W6692846177","https://openalex.org/W6703271639","https://openalex.org/W6741002519","https://openalex.org/W6748839928","https://openalex.org/W6762728350","https://openalex.org/W6801042162"],"related_works":["https://openalex.org/W2795085641","https://openalex.org/W2923452570","https://openalex.org/W206598027","https://openalex.org/W2978610750","https://openalex.org/W2022931285","https://openalex.org/W1589966275","https://openalex.org/W2086872282","https://openalex.org/W2137789903","https://openalex.org/W2138781885","https://openalex.org/W2153007255"],"abstract_inverted_index":{"As":[0],"an":[1,92],"emerging":[2],"and":[3,26,31,42,67,81,98,104,113,128,147,149,157,167,174],"promising":[4],"network":[5,7,29,61,154,163,191,195],"paradigm,":[6],"slicing":[8,62],"creates":[9],"multiple":[10],"logical":[11],"networks":[12],"on":[13],"shared":[14],"infrastructure":[15],"to":[16,64,109,120,188],"provide":[17],"services":[18],"with":[19,91,170],"customized":[20],"Quality-of-Service":[21],"(QoS)":[22],"for":[23],"heterogeneous":[24],"devices":[25],"applications.":[27],"However,":[28],"complexity":[30],"service":[32],"heterogeneity":[33],"pose":[34],"a":[35,52,78],"huge":[36],"challenge":[37],"in":[38,153,190],"achieving":[39,99],"optimal":[40],"performance":[41],"ensuring":[43],"stringent":[44],"QoS":[45,158],"requirements.":[46],"In":[47],"this":[48],"paper,":[49],"we":[50,180],"design":[51],"hierarchical":[53],"deep":[54],"reinforcement":[55],"learning":[56,106],"based":[57],"5G":[58],"radio":[59],"access":[60],"framework":[63,87,139,184],"achieve":[65],"scalable":[66,100],"efficient":[68],"resource":[69,74,143],"allocation.":[70],"By":[71],"decomposing":[72],"the":[73,85,137,162,171,175],"allocation":[75,144],"problem":[76],"into":[77],"slice-level":[79],"task":[80,90],"several":[82],"user-level":[83],"tasks,":[84],"proposed":[86,138],"tackles":[88],"each":[89],"agent,":[93],"thus":[94],"conquering":[95],"insufficient":[96],"exploration":[97],"management.":[101],"Knowledge":[102],"transfer":[103],"progressive":[105],"are":[107],"employed":[108],"improve":[110],"training":[111,119],"efficiency":[112],"stability,":[114],"respectively.":[115,178],"We":[116],"apply":[117],"collaborative":[118],"eliminate":[121],"distribution":[122],"mismatch":[123],"by":[124,165],"refining":[125],"value":[126],"approximators":[127],"policies":[129,145],"of":[130],"agents":[131],"alternately.":[132],"Extensive":[133],"experiments":[134],"show":[135],"that":[136,182],"can":[140],"learn":[141],"effective":[142],"stably":[146],"efficiently":[148],"outperform":[150],"other":[151],"methods":[152],"utility":[155,164],"maximization":[156],"assurance,":[159],"which":[160],"improves":[161],"25%":[166],"8%":[168],"compared":[169],"random":[172],"strategy":[173],"ADMM":[176],"strategy,":[177],"Furthermore,":[179],"validate":[181],"our":[183],"is":[185],"more":[186],"robust":[187],"changes":[189],"traffic":[192],"conditions":[193],"including":[194],"congestion.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
