{"id":"https://openalex.org/W4300680463","doi":"https://doi.org/10.1109/tnet.2022.3194953","title":"Delay-Oriented Scheduling in 5G Downlink Wireless Networks Based on Reinforcement Learning With Partial Observations","display_name":"Delay-Oriented Scheduling in 5G Downlink Wireless Networks Based on Reinforcement Learning With Partial Observations","publication_year":2022,"publication_date":"2022-08-05","ids":{"openalex":"https://openalex.org/W4300680463","doi":"https://doi.org/10.1109/tnet.2022.3194953"},"language":"en","primary_location":{"id":"doi:10.1109/tnet.2022.3194953","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnet.2022.3194953","pdf_url":null,"source":{"id":"https://openalex.org/S62238642","display_name":"IEEE/ACM Transactions on Networking","issn_l":"1063-6692","issn":["1063-6692","1558-2566"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Networking","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053624922","display_name":"Yijun Hao","orcid":"https://orcid.org/0000-0001-7636-2786"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yijun Hao","raw_affiliation_strings":["National Engineering Laboratory for Big Data Analytics (NEL-BDA), Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Laboratory for Big Data Analytics (NEL-BDA), Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100394213","display_name":"Fang Li","orcid":"https://orcid.org/0000-0003-1477-3875"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fang Li","raw_affiliation_strings":["National Engineering Laboratory for Big Data Analytics (NEL-BDA), Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Laboratory for Big Data Analytics (NEL-BDA), Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037412714","display_name":"Cong Zhao","orcid":"https://orcid.org/0000-0002-9002-4350"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Cong Zhao","raw_affiliation_strings":["Department of Computing, Imperial College London, London, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computing, Imperial College London, London, U.K","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067547680","display_name":"Shusen Yang","orcid":"https://orcid.org/0000-0002-4495-6237"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shusen Yang","raw_affiliation_strings":["National Engineering Laboratory for Big Data Analytics (NEL-BDA), Ministry of Education Key Laboratory for Intelligent Networks and Network Security (MOE KLINNS Laboratory), Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","Industrial Artificial Intelligence Center, Pazhou Laboratory, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Laboratory for Big Data Analytics (NEL-BDA), Ministry of Education Key Laboratory for Intelligent Networks and Network Security (MOE KLINNS Laboratory), Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]},{"raw_affiliation_string":"Industrial Artificial Intelligence Center, Pazhou Laboratory, Guangzhou, China","institution_ids":["https://openalex.org/I4210100255"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053624922"],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":1.4637,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.81487639,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"31","issue":"1","first_page":"380","last_page":"394"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11158","display_name":"Wireless Networks and Protocols","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8655276298522949},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.752778172492981},{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.6938743591308594},{"id":"https://openalex.org/keywords/telecommunications-link","display_name":"Telecommunications link","score":0.6777150630950928},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5978403687477112},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5831257104873657},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.5180850028991699},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.4794239401817322},{"id":"https://openalex.org/keywords/network-packet","display_name":"Network packet","score":0.47926709055900574},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4388889968395233},{"id":"https://openalex.org/keywords/cellular-network","display_name":"Cellular network","score":0.4368610978126526},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.41063350439071655},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.4097985029220581},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.39300161600112915},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.36150410771369934},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.2642660140991211},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.16567003726959229},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16248396039009094},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.13112518191337585}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8655276298522949},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.752778172492981},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.6938743591308594},{"id":"https://openalex.org/C138660444","wikidata":"https://www.wikidata.org/wiki/Q5607897","display_name":"Telecommunications link","level":2,"score":0.6777150630950928},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5978403687477112},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5831257104873657},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.5180850028991699},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.4794239401817322},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.47926709055900574},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4388889968395233},{"id":"https://openalex.org/C153646914","wikidata":"https://www.wikidata.org/wiki/Q535695","display_name":"Cellular network","level":2,"score":0.4368610978126526},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.41063350439071655},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.4097985029220581},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.39300161600112915},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.36150410771369934},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.2642660140991211},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.16567003726959229},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16248396039009094},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.13112518191337585},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tnet.2022.3194953","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnet.2022.3194953","pdf_url":null,"source":{"id":"https://openalex.org/S62238642","display_name":"IEEE/ACM Transactions on Networking","issn_l":"1063-6692","issn":["1063-6692","1558-2566"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Networking","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1082092869","display_name":null,"funder_award_id":"2020T130513","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"},{"id":"https://openalex.org/G1769842585","display_name":null,"funder_award_id":"2020YFA0713900","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2045660238","display_name":null,"funder_award_id":"61802298","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2066389582","display_name":null,"funder_award_id":"2019M663726","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"},{"id":"https://openalex.org/G5234250448","display_name":null,"funder_award_id":"11690011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5372072380","display_name":null,"funder_award_id":"U1811461","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6727632337","display_name":null,"funder_award_id":"61772410","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7108580912","display_name":null,"funder_award_id":"62172329","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8698885527","display_name":null,"funder_award_id":"U21A6005","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1689711448","https://openalex.org/W1977556410","https://openalex.org/W1982063824","https://openalex.org/W2011798739","https://openalex.org/W2022138967","https://openalex.org/W2027419845","https://openalex.org/W2054692642","https://openalex.org/W2094860320","https://openalex.org/W2108137967","https://openalex.org/W2108327442","https://openalex.org/W2112577169","https://openalex.org/W2159494247","https://openalex.org/W2291973609","https://openalex.org/W2328220946","https://openalex.org/W2343448572","https://openalex.org/W2492150193","https://openalex.org/W2559744077","https://openalex.org/W2605344455","https://openalex.org/W2736601468","https://openalex.org/W2747599906","https://openalex.org/W2762605243","https://openalex.org/W2784277076","https://openalex.org/W2788005034","https://openalex.org/W2890072063","https://openalex.org/W2890483234","https://openalex.org/W2890889532","https://openalex.org/W2920334458","https://openalex.org/W2945086780","https://openalex.org/W2962752580","https://openalex.org/W2962790412","https://openalex.org/W2962896678","https://openalex.org/W2963049774","https://openalex.org/W2963864421","https://openalex.org/W2964015378","https://openalex.org/W3105610356","https://openalex.org/W3126805270","https://openalex.org/W3160306825","https://openalex.org/W4239181556","https://openalex.org/W6638636849","https://openalex.org/W6677939520","https://openalex.org/W6683204974","https://openalex.org/W6684921986","https://openalex.org/W6692846177","https://openalex.org/W6696783566","https://openalex.org/W6726873649","https://openalex.org/W6741002519","https://openalex.org/W6752725515","https://openalex.org/W6757184387"],"related_works":["https://openalex.org/W2096013579","https://openalex.org/W52153049","https://openalex.org/W1760611253","https://openalex.org/W1589140671","https://openalex.org/W2951545791","https://openalex.org/W1515117609","https://openalex.org/W2294884454","https://openalex.org/W790449367","https://openalex.org/W4323315247","https://openalex.org/W3169161914"],"abstract_inverted_index":{"5G":[0,59,175],"wireless":[1],"networks":[2,61],"are":[3],"expected":[4],"to":[5,25,32,98,120,196],"satisfy":[6],"different":[7,129],"delay":[8,162,190,193],"requirements":[9],"of":[10,44,169,187],"various":[11],"traffics":[12],"by":[13,148],"network":[14,45],"resource":[15],"scheduling.":[16],"Existing":[17],"scheduling":[18,55,90],"methods":[19],"perform":[20],"poorly":[21],"in":[22,57,163,185],"practice":[23],"due":[24],"their":[26],"unrealistic":[27],"assumption":[28],"on":[29,93,172],"the":[30,33,40,52,101,106,122,133,143,157],"access":[31],"full":[34,107],"channel":[35,108],"state":[36,124],"information":[37,146],"(CSI)":[38],"or":[39],"explicit":[41],"mathematical":[42],"expression":[43],"delay.":[46],"In":[47],"this":[48],"paper,":[49],"we":[50],"consider":[51],"delay-oriented":[53,88],"packet":[54],"problem":[56],"multi-cell":[58,165],"downlink":[60,89],"with":[62,132],"multiple":[63],"users":[64],"and":[65,71,74,125,159,191,198],"traffic":[66,103,145],"types":[67],"(e.g.,":[68],"FTP,":[69],"VoIP":[70],"video":[72],"streaming),":[73],"formulate":[75],"it":[76],"as":[77],"a":[78,87,111,149,173],"partially":[79],"observable":[80],"Markov":[81],"decision":[82],"process":[83],"(POMDP).":[84],"We":[85],"design":[86],"framework":[91,180],"based":[92],"deep":[94],"reinforcement":[95],"learning":[96,127],"(DRL)":[97],"autonomously":[99],"schedule":[100],"active":[102],"flows":[104],"without":[105],"information.":[109],"Furthermore,":[110],"recurrent":[112],"proximal":[113],"policy":[114,134],"optimization":[115],"(RPPO)":[116],"algorithm":[117],"is":[118],"proposed":[119,150],"perceive":[121],"underlying":[123],"accelerate":[126],"under":[128,137],"time":[130],"granularities,":[131],"gradient":[135],"theorem":[136],"POMDP":[138],"strictly":[139],"proved.":[140],"By":[141],"incorporating":[142],"future":[144],"provided":[147],"spatial-temporal":[151],"prediction":[152],"algorithm,":[153],"RPPO":[154],"can":[155],"balance":[156],"load":[158],"achieve":[160],"lower":[161],"real-time":[164],"multi-user":[166],"scenarios.":[167],"Results":[168],"extensive":[170],"experiments":[171],"realistic":[174],"simulator":[176],"demonstrate":[177],"that":[178],"our":[179],"significantly":[181],"outperforms":[182],"existing":[183],"approaches":[184],"terms":[186],"both":[188],"tail":[189],"average":[192],"for":[194],"up":[195],"48%":[197],"41.7%,":[199],"respectively.":[200]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
