{"id":"https://openalex.org/W4294811272","doi":"https://doi.org/10.1109/tccn.2022.3204572","title":"Learning From Peers: Deep Transfer Reinforcement Learning for Joint Radio and Cache Resource Allocation in 5G RAN Slicing","display_name":"Learning From Peers: Deep Transfer Reinforcement Learning for Joint Radio and Cache Resource Allocation in 5G RAN Slicing","publication_year":2022,"publication_date":"2022-09-06","ids":{"openalex":"https://openalex.org/W4294811272","doi":"https://doi.org/10.1109/tccn.2022.3204572"},"language":"en","primary_location":{"id":"doi:10.1109/tccn.2022.3204572","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tccn.2022.3204572","pdf_url":null,"source":{"id":"https://openalex.org/S2484188435","display_name":"IEEE Transactions on Cognitive Communications and Networking","issn_l":"2332-7731","issn":["2332-7731","2372-2045"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive Communications and Networking","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080850676","display_name":"Hao Zhou","orcid":"https://orcid.org/0000-0002-5511-4609"},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Hao Zhou","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, Canada"],"raw_orcid":"https://orcid.org/0000-0002-5511-4609","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089891162","display_name":"Melike Erol\u2010Kantarci","orcid":"https://orcid.org/0000-0001-6787-8457"},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Melike Erol-Kantarci","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, Canada"],"raw_orcid":"https://orcid.org/0000-0001-6787-8457","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"last","author":{"id":null,"display_name":"H. Vincent Poor","orcid":"https://orcid.org/0000-0002-8068-5120"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"H. Vincent Poor","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA"],"raw_orcid":"https://orcid.org/0000-0002-8068-5120","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5080850676"],"corresponding_institution_ids":["https://openalex.org/I153718931"],"apc_list":null,"apc_paid":null,"fwci":6.4203,"has_fulltext":false,"cited_by_count":50,"citation_normalized_percentile":{"value":0.97084981,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"8","issue":"4","first_page":"1925","last_page":"1941"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12791","display_name":"Full-Duplex Wireless Communications","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9002482891082764},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8712766766548157},{"id":"https://openalex.org/keywords/radio-access-network","display_name":"Radio access network","score":0.6604164838790894},{"id":"https://openalex.org/keywords/c-ran","display_name":"C-RAN","score":0.5567286014556885},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.5515312552452087},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.4782480299472809},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4714159667491913},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.4609852731227875},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.459652841091156},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43709596991539},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.43638747930526733},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.42484188079833984},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42058265209198},{"id":"https://openalex.org/keywords/orchestration","display_name":"Orchestration","score":0.4119298458099365},{"id":"https://openalex.org/keywords/base-station","display_name":"Base station","score":0.26050886511802673},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.21564513444900513},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.12391793727874756}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9002482891082764},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8712766766548157},{"id":"https://openalex.org/C106365562","wikidata":"https://www.wikidata.org/wiki/Q3078360","display_name":"Radio access network","level":4,"score":0.6604164838790894},{"id":"https://openalex.org/C2779765720","wikidata":"https://www.wikidata.org/wiki/Q5005908","display_name":"C-RAN","level":5,"score":0.5567286014556885},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.5515312552452087},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.4782480299472809},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4714159667491913},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.4609852731227875},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.459652841091156},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43709596991539},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.43638747930526733},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.42484188079833984},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42058265209198},{"id":"https://openalex.org/C199168358","wikidata":"https://www.wikidata.org/wiki/Q3367000","display_name":"Orchestration","level":3,"score":0.4119298458099365},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.26050886511802673},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.21564513444900513},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.12391793727874756},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C207029474","wikidata":"https://www.wikidata.org/wiki/Q384018","display_name":"Mobile station","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tccn.2022.3204572","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tccn.2022.3204572","pdf_url":null,"source":{"id":"https://openalex.org/S2484188435","display_name":"IEEE Transactions on Cognitive Communications and Networking","issn_l":"2332-7731","issn":["2332-7731","2372-2045"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive Communications and Networking","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6552507291","display_name":null,"funder_award_id":"497981","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"},{"id":"https://openalex.org/G8554439942","display_name":null,"funder_award_id":"CNS-2128448","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1504915502","https://openalex.org/W1549860141","https://openalex.org/W1591992921","https://openalex.org/W2028344184","https://openalex.org/W2097381042","https://openalex.org/W2105960367","https://openalex.org/W2133040789","https://openalex.org/W2136547295","https://openalex.org/W2136848157","https://openalex.org/W2145339207","https://openalex.org/W2164114810","https://openalex.org/W2165698076","https://openalex.org/W2605344455","https://openalex.org/W2624944960","https://openalex.org/W2794138919","https://openalex.org/W2794673877","https://openalex.org/W2804647677","https://openalex.org/W2805173205","https://openalex.org/W2891286892","https://openalex.org/W2914785290","https://openalex.org/W2951714068","https://openalex.org/W2961380111","https://openalex.org/W2963334314","https://openalex.org/W2963829278","https://openalex.org/W2964000600","https://openalex.org/W2970759804","https://openalex.org/W2989639897","https://openalex.org/W2989734355","https://openalex.org/W3009197653","https://openalex.org/W3013469985","https://openalex.org/W3023434827","https://openalex.org/W3039237082","https://openalex.org/W3091704528","https://openalex.org/W3113734015","https://openalex.org/W3205905181","https://openalex.org/W3209687765","https://openalex.org/W3217599394","https://openalex.org/W4383112908","https://openalex.org/W6635516443","https://openalex.org/W6674600207","https://openalex.org/W6675715384","https://openalex.org/W6679818365","https://openalex.org/W6774697201","https://openalex.org/W6783144354"],"related_works":["https://openalex.org/W2592537445","https://openalex.org/W2117039245","https://openalex.org/W2497039592","https://openalex.org/W3138350675","https://openalex.org/W2436923341","https://openalex.org/W2902173727","https://openalex.org/W4287262510","https://openalex.org/W2064969374","https://openalex.org/W4205856738","https://openalex.org/W2885291556"],"abstract_inverted_index":{"Network":[0],"slicing":[1],"is":[2],"a":[3,71,93],"critical":[4],"technique":[5],"for":[6,48,78,96,172,184],"5G":[7,87],"communications":[8],"that":[9],"covers":[10],"radio":[11,33,80],"access":[12],"network":[13,22,29,49],"(RAN),":[14],"edge,":[15],"transport":[16],"and":[17,34,81,112,151,157,180,203],"core":[18],"slicing.":[19,89],"The":[20,137],"evolving":[21],"architecture":[23,95],"requires":[24],"the":[25,60,121,144,152],"orchestration":[26],"of":[27,59],"multiple":[28],"resources":[30],"such":[31],"as":[32],"cache":[35,82],"resources.":[36],"In":[37,66,120],"recent":[38],"years,":[39],"machine":[40],"learning":[41,75,110,118],"(ML)":[42],"techniques":[43],"have":[44],"been":[45],"widely":[46],"applied":[47],"management.":[50],"However,":[51],"most":[52],"existing":[53],"works":[54],"do":[55],"not":[56],"take":[57],"advantage":[58],"knowledge":[61,129],"transfer":[62,73,108,116],"capability":[63],"in":[64],"ML.":[65],"this":[67],"paper,":[68],"we":[69,101],"propose":[70,102],"deep":[72,107,115,148],"reinforcement":[74,109,117],"(DTRL)":[76],"scheme":[77],"joint":[79,97],"resource":[83,98],"allocation":[84],"to":[85,130,212],"serve":[86],"RAN":[88],"We":[90],"first":[91],"define":[92],"hierarchical":[94],"allocation.":[99],"Then":[100],"two":[103],"DTRL":[104],"algorithms:":[105],"Q-value-based":[106],"(QDTRL)":[111],"action":[113],"selection-based":[114],"(ADTRL).":[119],"proposed":[122,138,165],"schemes,":[123],"learner":[124],"agents":[125],"utilize":[126],"expert":[127],"agents\u2019":[128],"improve":[131],"their":[132],"performance":[133],"on":[134],"current":[135],"tasks.":[136],"algorithms":[139],"are":[140,208],"compared":[141],"with":[142,162,210],"both":[143],"model-free":[145],"exploration":[146],"bonus":[147],"Q-learning":[149],"(EB-DQN)":[150],"model-based":[153],"priority":[154],"proportional":[155],"fairness":[156],"time-to-live":[158],"(PPF-TTL)":[159],"algorithms.":[160],"Compared":[161],"EB-DQN,":[163],"our":[164],"DTRL-based":[166],"method":[167],"presents":[168],"21.4%":[169],"lower":[170,200],"delay":[171,202],"Ultra":[173],"Reliable":[174],"Low":[175],"Latency":[176],"Communications":[177],"(URLLC)":[178],"slice":[179],"22.4%":[181],"higher":[182,205],"throughput":[183,207],"enhanced":[185],"Mobile":[186],"Broad":[187],"Band":[188],"(eMBB)":[189],"slice,":[190],"while":[191],"achieving":[192],"significantly":[193],"faster":[194],"convergence":[195],"than":[196],"EB-DQN.":[197],"Moreover,":[198],"40.8%":[199],"URLLC":[201],"59.8%":[204],"eMBB":[206],"observed":[209],"respect":[211],"PPF-TTL.":[213]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
