{"id":"https://openalex.org/W4387870487","doi":"https://doi.org/10.1109/iccworkshops57953.2023.10283808","title":"Reinforcement Learning for Resource Allocation with Periodic Traffic Patterns","display_name":"Reinforcement Learning for Resource Allocation with Periodic Traffic Patterns","publication_year":2023,"publication_date":"2023-05-28","ids":{"openalex":"https://openalex.org/W4387870487","doi":"https://doi.org/10.1109/iccworkshops57953.2023.10283808"},"language":"en","primary_location":{"id":"doi:10.1109/iccworkshops57953.2023.10283808","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/iccworkshops57953.2023.10283808","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Communications Workshops (ICC Workshops)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101621051","display_name":"Zheyu Chen","orcid":"https://orcid.org/0009-0003-5779-3523"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Zheyu Chen","raw_affiliation_strings":["Imperial College,London,UK","Imperial College, London, UK"],"affiliations":[{"raw_affiliation_string":"Imperial College,London,UK","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Imperial College, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020917506","display_name":"Kin K. Leung","orcid":"https://orcid.org/0000-0002-3860-6257"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kin K. Leung","raw_affiliation_strings":["Imperial College,London,UK","Imperial College, London, UK"],"affiliations":[{"raw_affiliation_string":"Imperial College,London,UK","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Imperial College, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100443968","display_name":"Shiqiang Wang","orcid":"https://orcid.org/0000-0003-2090-5512"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shiqiang Wang","raw_affiliation_strings":["IBM T.J. Watson Research Center,Yorktown Heights,NY,USA","IBM T.J. Watson Research Center, Yorktown Heights, NY, USA"],"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center,Yorktown Heights,NY,USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"IBM T.J. Watson Research Center, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014892027","display_name":"Leandros Tassiulas","orcid":"https://orcid.org/0000-0003-0932-774X"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Leandros Tassiulas","raw_affiliation_strings":["Yale University,New Haven,CT,USA","Yale University, New Haven, CT, USA"],"affiliations":[{"raw_affiliation_string":"Yale University,New Haven,CT,USA","institution_ids":["https://openalex.org/I32971472"]},{"raw_affiliation_string":"Yale University, New Haven, CT, USA","institution_ids":["https://openalex.org/I32971472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057402438","display_name":"Kevin Chan","orcid":"https://orcid.org/0000-0002-6425-5403"},"institutions":[{"id":"https://openalex.org/I2802705668","display_name":"United States Army Combat Capabilities Development Command","ror":"https://ror.org/02rdkx920","country_code":"US","type":"other","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I2802705668","https://openalex.org/I4210154437"]},{"id":"https://openalex.org/I166416128","display_name":"DEVCOM Army Research Laboratory","ror":"https://ror.org/011hc8f90","country_code":"US","type":"government","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I166416128","https://openalex.org/I2802705668","https://openalex.org/I4210154437"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kevin Chan","raw_affiliation_strings":["DEVCOM Army Research Laboratory,Adelphi,MD,USA","DEVCOM Army Research Laboratory, Adelphi, MD, USA"],"affiliations":[{"raw_affiliation_string":"DEVCOM Army Research Laboratory,Adelphi,MD,USA","institution_ids":["https://openalex.org/I166416128","https://openalex.org/I2802705668"]},{"raw_affiliation_string":"DEVCOM Army Research Laboratory, Adelphi, MD, USA","institution_ids":["https://openalex.org/I166416128","https://openalex.org/I2802705668"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085092796","display_name":"Patrick J. Baker","orcid":"https://orcid.org/0000-0002-6560-7124"},"institutions":[{"id":"https://openalex.org/I2800289278","display_name":"Royal Air Force College Cranwell","ror":"https://ror.org/01g0pjd14","country_code":"GB","type":"education","lineage":["https://openalex.org/I2800289278"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Patrick J. Baker","raw_affiliation_strings":["UK Royal Air Force and Dstl,UK","UK Royal Air Force and Dstl, UK"],"affiliations":[{"raw_affiliation_string":"UK Royal Air Force and Dstl,UK","institution_ids":["https://openalex.org/I2800289278"]},{"raw_affiliation_string":"UK Royal Air Force and Dstl, UK","institution_ids":["https://openalex.org/I2800289278"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101621051"],"corresponding_institution_ids":["https://openalex.org/I47508984"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16373018,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"752","last_page":"757"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8322553038597107},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.828486442565918},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.79051673412323},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6725400686264038},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.6675384640693665},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.569835364818573},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5302923321723938},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.5224694013595581},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5132837295532227},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.46755850315093994},{"id":"https://openalex.org/keywords/resource-management","display_name":"Resource management (computing)","score":0.4465208649635315},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.4198695421218872},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3431164622306824},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.26406192779541016},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1216505765914917},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.10362958908081055},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08758074045181274},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07515561580657959}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8322553038597107},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.828486442565918},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79051673412323},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6725400686264038},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.6675384640693665},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.569835364818573},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5302923321723938},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.5224694013595581},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5132837295532227},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.46755850315093994},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.4465208649635315},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4198695421218872},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3431164622306824},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.26406192779541016},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1216505765914917},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.10362958908081055},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08758074045181274},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07515561580657959},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccworkshops57953.2023.10283808","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/iccworkshops57953.2023.10283808","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Communications Workshops (ICC Workshops)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1977556410","https://openalex.org/W1990667931","https://openalex.org/W1990862669","https://openalex.org/W1993476605","https://openalex.org/W2075557304","https://openalex.org/W2076330565","https://openalex.org/W2171092272","https://openalex.org/W2396221166","https://openalex.org/W2736601468","https://openalex.org/W2791730371","https://openalex.org/W2900204506","https://openalex.org/W2920054549","https://openalex.org/W2953169926","https://openalex.org/W3045232563","https://openalex.org/W3185035147","https://openalex.org/W6644682428","https://openalex.org/W6712528029","https://openalex.org/W6741002519"],"related_works":["https://openalex.org/W187740018","https://openalex.org/W2162286586","https://openalex.org/W2923452570","https://openalex.org/W4255368532","https://openalex.org/W206598027","https://openalex.org/W2978610750","https://openalex.org/W2022931285","https://openalex.org/W1589966275","https://openalex.org/W2086872282","https://openalex.org/W2137789903"],"abstract_inverted_index":{"It":[0],"is":[1,135],"common":[2],"to":[3,74,103,127],"formulate":[4],"resource-allocation":[5,130],"problems":[6,69],"in":[7,145,154],"communication":[8],"networks":[9],"as":[10],"Markov":[11],"decision":[12],"process":[13,111],"(MDP)":[14],"and":[15,86,112],"solve":[16],"it":[17],"by":[18,167],"using":[19,149,168,175],"deep":[20],"reinforcement":[21],"learning":[22],"(DRL)":[23],"techniques.":[24],"However,":[25],"this":[26],"approach":[27],"often":[28],"cannot":[29],"find":[30],"the":[31,44,49,54,57,61,68,105,108,114,129,139,146,150,155,163,169],"optimal":[32],"action":[33],"policy":[34],"when":[35],"task":[36,109,152,164],"(demand)":[37],"arrivals":[38,153],"present":[39],"a":[40,80,92,97,121,133],"periodic":[41,62],"pattern":[42],"since":[43],"systems":[45],"do":[46],"not":[47],"satisfy":[48],"underlying":[50],"mathematical":[51],"properties":[52],"of":[53,83,107,123,142,172,182],"MDP.":[55],"On":[56],"other":[58],"hand,":[59],"solving":[60],"MDP,":[63],"which":[64],"can":[65,177],"precisely":[66],"model":[67,128],"under":[70],"consideration,":[71],"may":[72],"need":[73],"generate":[75],"many":[76],"policies,":[77],"thus":[78],"requiring":[79],"prohibitive":[81],"amount":[82],"computation":[84],"resources":[85],"excessive":[87],"training":[88],"time.":[89],"To":[90],"achieve":[91],"balanced":[93],"trade-off,":[94],"we":[95],"propose":[96],"DRL":[98,176],"framework":[99,171],"that":[100,120,162],"includes":[101],"procedures":[102],"determine":[104],"period":[106,115],"arrival":[110],"partition":[113],"into":[116],"time":[117],"intervals":[118],"so":[119],"sequence":[122],"MDPs":[124,143],"are":[125],"used":[126,144],"problems.":[131],"Furthermore,":[132],"method":[134],"proposed":[136,170],"for":[137],"choosing":[138],"appropriate":[140],"number":[141],"framework.":[147],"By":[148],"practical":[151],"Alibaba":[156],"dataset,":[157],"our":[158],"experimental":[159],"results":[160],"reveal":[161],"utilities":[165],"obtained":[166],"sequential":[173],"policies":[174],"yield":[178],"an":[179,187],"average":[180],"improvement":[181],"23%":[183],"over":[184],"those":[185],"from":[186],"RL":[188],"solution":[189],"with":[190],"one":[191],"single":[192],"policy.":[193]},"counts_by_year":[],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
