{"id":"https://openalex.org/W3126805270","doi":"https://doi.org/10.1109/tnet.2021.3051663","title":"Learning to Schedule Network Resources Throughput and Delay Optimally Using Q<sup>+</sup>-Learning","display_name":"Learning to Schedule Network Resources Throughput and Delay Optimally Using Q<sup>+</sup>-Learning","publication_year":2021,"publication_date":"2021-01-26","ids":{"openalex":"https://openalex.org/W3126805270","doi":"https://doi.org/10.1109/tnet.2021.3051663","mag":"3126805270"},"language":"en","primary_location":{"id":"doi:10.1109/tnet.2021.3051663","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnet.2021.3051663","pdf_url":null,"source":{"id":"https://openalex.org/S62238642","display_name":"IEEE/ACM Transactions on Networking","issn_l":"1063-6692","issn":["1063-6692","1558-2566"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Networking","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5106761258","display_name":"Jeongmin Bae","orcid":"https://orcid.org/0000-0002-7430-0183"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jeongmin Bae","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100318495","display_name":"Joohyun Lee","orcid":"https://orcid.org/0000-0002-7698-1568"},"institutions":[{"id":"https://openalex.org/I4575257","display_name":"Hanyang University","ror":"https://ror.org/046865y68","country_code":"KR","type":"education","lineage":["https://openalex.org/I4575257"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Joohyun Lee","raw_affiliation_strings":["Division of Electrical Engineering, Hanyang University, Ansan, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Electrical Engineering, Hanyang University, Ansan, South Korea","institution_ids":["https://openalex.org/I4575257"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102076010","display_name":"Song Chong","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Song Chong","raw_affiliation_strings":["Graduate School of AI, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of AI, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]},{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.4238,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.80860043,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"29","issue":"2","first_page":"750","last_page":"763"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7465054988861084},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6015249490737915},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5948271155357361},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5330508947372437},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5199488401412964},{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.4782347083091736},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.4306488633155823},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.36998552083969116},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3481331467628479},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.25924795866012573},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20105478167533875}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7465054988861084},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6015249490737915},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5948271155357361},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5330508947372437},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5199488401412964},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.4782347083091736},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.4306488633155823},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.36998552083969116},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3481331467628479},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.25924795866012573},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20105478167533875},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tnet.2021.3051663","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnet.2021.3051663","pdf_url":null,"source":{"id":"https://openalex.org/S62238642","display_name":"IEEE/ACM Transactions on Networking","issn_l":"1063-6692","issn":["1063-6692","1558-2566"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Networking","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":67,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W80012474","https://openalex.org/W107583932","https://openalex.org/W1518931405","https://openalex.org/W1599841949","https://openalex.org/W1757796397","https://openalex.org/W1966208686","https://openalex.org/W1969276875","https://openalex.org/W1984181498","https://openalex.org/W1986389067","https://openalex.org/W2003346154","https://openalex.org/W2009551863","https://openalex.org/W2010654234","https://openalex.org/W2029631728","https://openalex.org/W2030544250","https://openalex.org/W2038007012","https://openalex.org/W2049934117","https://openalex.org/W2070317877","https://openalex.org/W2082691056","https://openalex.org/W2101242010","https://openalex.org/W2105177639","https://openalex.org/W2109341366","https://openalex.org/W2119380668","https://openalex.org/W2120344179","https://openalex.org/W2129670787","https://openalex.org/W2135663206","https://openalex.org/W2137152139","https://openalex.org/W2138993731","https://openalex.org/W2145339207","https://openalex.org/W2150516182","https://openalex.org/W2161966552","https://openalex.org/W2164599584","https://openalex.org/W2165131254","https://openalex.org/W2165768656","https://openalex.org/W2173655337","https://openalex.org/W2327545172","https://openalex.org/W2400861403","https://openalex.org/W2489939061","https://openalex.org/W2553188523","https://openalex.org/W2562947506","https://openalex.org/W2565612488","https://openalex.org/W2596760110","https://openalex.org/W2741401130","https://openalex.org/W2756144809","https://openalex.org/W2763737552","https://openalex.org/W2784320632","https://openalex.org/W2911931139","https://openalex.org/W2950929549","https://openalex.org/W2963049774","https://openalex.org/W2963549123","https://openalex.org/W3044168612","https://openalex.org/W3093951152","https://openalex.org/W4253201987","https://openalex.org/W4285719527","https://openalex.org/W4297972233","https://openalex.org/W4298857966","https://openalex.org/W6603282716","https://openalex.org/W6604362843","https://openalex.org/W6635872325","https://openalex.org/W6637967152","https://openalex.org/W6675043515","https://openalex.org/W6683603353","https://openalex.org/W6729964979","https://openalex.org/W6747875335","https://openalex.org/W6752725515","https://openalex.org/W6758345023","https://openalex.org/W6769989166"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W1985560493","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894","https://openalex.org/W187740018"],"abstract_inverted_index":{"As":[0],"network":[1,15,43,66],"architecture":[2],"becomes":[3,18],"complex":[4],"and":[5,54,90],"the":[6,11,28,65,124,135,155,159,180,190],"user":[7],"requirement":[8],"gets":[9],"diverse,":[10],"role":[12],"of":[13,123,147,158,174],"efficient":[14,133],"resource":[16],"management":[17],"more":[19,132],"important.":[20],"However,":[21],"existing":[22],"throughput-optimal":[23],"scheduling":[24,44],"algorithms":[25,45],"such":[26],"as":[27,69],"max-weight":[29,181],"algorithm":[30,95,169,182],"suffer":[31],"from":[32,139],"poor":[33],"delay":[34,172],"performance.":[35],"In":[36],"this":[37,60],"paper,":[38],"we":[39,62,77,165],"present":[40],"reinforcement":[41,93],"learning-based":[42],"for":[46],"a":[47,70,79,92,114,145,171],"single-hop":[48],"downlink":[49],"scenario":[50],"which":[51,108,130],"achieve":[52],"throughput-optimality":[53],"converge":[55],"to":[56,176,179,200],"minimal":[57],"delay.":[58],"To":[59],"end,":[61],"first":[63],"formulate":[64],"optimization":[67],"problem":[68],"Markov":[71],"decision":[72],"process":[73],"(MDP)":[74],"problem.":[75,161],"Then,":[76],"introduce":[78],"new":[80],"state-action":[81],"value":[82],"function":[83],"called":[84,96],"Q":[85,97,191],"<sup":[86,98,149,192],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[87,99,150,193],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">+</sup>":[88,100,194],"-function":[89],"develop":[91],"learning":[94,115],"-learning":[101,195],"with":[102,141,196,209],"UCB":[103,142,197],"(Upper":[104],"Confidence":[105],"Bound)":[106],"exploration":[107,143,198],"guarantees":[109],"small":[110],"performance":[111],"loss":[112],"during":[113],"process.":[116],"We":[117,186],"also":[118,187],"derive":[119],"an":[120,201],"upper":[121],"bound":[122,138],"sample":[125],"complexity":[126],"in":[127],"our":[128,168],"algorithm,":[129],"is":[131,154],"than":[134,207],"best":[136],"known":[137],"Q-learning":[140,208],"by":[144],"factor":[146,157],"\u03b3":[148,153],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[151],"where":[152],"discount":[156],"MDP":[160],"Finally,":[162],"via":[163],"simulation,":[164],"verify":[166],"that":[167,189],"shows":[170],"reduction":[173],"up":[175],"40.8%":[177],"compared":[178],"over":[183],"various":[184],"scenarios.":[185],"show":[188],"converges":[199],"\u03b5-optimal":[202],"policy":[203],"10":[204],"times":[205],"faster":[206],"UCB.":[210]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
