{"id":"https://openalex.org/W3198479314","doi":"https://doi.org/10.1109/globecom46510.2021.9685702","title":"Deep Reinforcement Learning for Wireless Resource Allocation Using Buffer State Information","display_name":"Deep Reinforcement Learning for Wireless Resource Allocation Using Buffer State Information","publication_year":2021,"publication_date":"2021-12-01","ids":{"openalex":"https://openalex.org/W3198479314","doi":"https://doi.org/10.1109/globecom46510.2021.9685702","mag":"3198479314"},"language":"en","primary_location":{"id":"doi:10.1109/globecom46510.2021.9685702","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom46510.2021.9685702","pdf_url":null,"source":{"id":"https://openalex.org/S4363607714","display_name":"2021 IEEE Global Communications Conference (GLOBECOM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Global Communications Conference (GLOBECOM)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2108.12198","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039320529","display_name":"Eike-Manuel Bansbach","orcid":null},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Eike-Manuel Bansbach","raw_affiliation_strings":["Communications Engineering Lab, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","Karlsruhe Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Communications Engineering Lab, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]},{"raw_affiliation_string":"Karlsruhe Institute of Technology","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031923248","display_name":"Victor Eliachevitch","orcid":null},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Victor Eliachevitch","raw_affiliation_strings":["Communications Engineering Lab, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Communications Engineering Lab, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053280913","display_name":"Laurent Schmalen","orcid":"https://orcid.org/0000-0002-1459-9128"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Laurent Schmalen","raw_affiliation_strings":["Communications Engineering Lab, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Communications Engineering Lab, Karlsruhe Institute of Technology (KIT), Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5039320529"],"corresponding_institution_ids":["https://openalex.org/I102335020"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10423985,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11158","display_name":"Wireless Networks and Protocols","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8226428031921387},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7979949712753296},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.5521449446678162},{"id":"https://openalex.org/keywords/orthogonal-frequency-division-multiple-access","display_name":"Orthogonal frequency-division multiple access","score":0.539078950881958},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5367336273193359},{"id":"https://openalex.org/keywords/network-packet","display_name":"Network packet","score":0.5326366424560547},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4948553442955017},{"id":"https://openalex.org/keywords/base-station","display_name":"Base station","score":0.48227694630622864},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.46126702427864075},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4455564022064209},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.4260326325893402},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4194942116737366},{"id":"https://openalex.org/keywords/convex-optimization","display_name":"Convex optimization","score":0.41581037640571594},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.41108548641204834},{"id":"https://openalex.org/keywords/orthogonal-frequency-division-multiplexing","display_name":"Orthogonal frequency-division multiplexing","score":0.29555052518844604},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2240065336227417},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.18740132451057434},{"id":"https://openalex.org/keywords/regular-polygon","display_name":"Regular polygon","score":0.11952018737792969},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08453428745269775}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8226428031921387},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7979949712753296},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.5521449446678162},{"id":"https://openalex.org/C2775907427","wikidata":"https://www.wikidata.org/wiki/Q2697649","display_name":"Orthogonal frequency-division multiple access","level":4,"score":0.539078950881958},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5367336273193359},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.5326366424560547},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4948553442955017},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.48227694630622864},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.46126702427864075},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4455564022064209},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.4260326325893402},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4194942116737366},{"id":"https://openalex.org/C157972887","wikidata":"https://www.wikidata.org/wiki/Q463359","display_name":"Convex optimization","level":3,"score":0.41581037640571594},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.41108548641204834},{"id":"https://openalex.org/C40409654","wikidata":"https://www.wikidata.org/wiki/Q375889","display_name":"Orthogonal frequency-division multiplexing","level":3,"score":0.29555052518844604},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2240065336227417},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.18740132451057434},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.11952018737792969},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08453428745269775},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/globecom46510.2021.9685702","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom46510.2021.9685702","pdf_url":null,"source":{"id":"https://openalex.org/S4363607714","display_name":"2021 IEEE Global Communications Conference (GLOBECOM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Global Communications Conference (GLOBECOM)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2108.12198","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.12198","pdf_url":"https://arxiv.org/pdf/2108.12198","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3198479314","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/2108.12198.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2108.12198","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2108.12198","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2108.12198","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.12198","pdf_url":"https://arxiv.org/pdf/2108.12198","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3198479314.pdf","grobid_xml":"https://content.openalex.org/works/W3198479314.grobid-xml"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1503398984","https://openalex.org/W1983850919","https://openalex.org/W1990022790","https://openalex.org/W2101413281","https://openalex.org/W2116456097","https://openalex.org/W2121863487","https://openalex.org/W2159715570","https://openalex.org/W2159777336","https://openalex.org/W2171121903","https://openalex.org/W2782068308","https://openalex.org/W2789517807","https://openalex.org/W2898035736","https://openalex.org/W2909125469","https://openalex.org/W2963250023","https://openalex.org/W2969482782","https://openalex.org/W2994992444","https://openalex.org/W3034687650","https://openalex.org/W3036196187","https://openalex.org/W4240896209","https://openalex.org/W6683969366","https://openalex.org/W6748440607"],"related_works":["https://openalex.org/W3152685233","https://openalex.org/W2949886190","https://openalex.org/W3006896224","https://openalex.org/W2244504972","https://openalex.org/W2989655684","https://openalex.org/W3043667852","https://openalex.org/W3099495391","https://openalex.org/W3089655738","https://openalex.org/W3044319949","https://openalex.org/W2044988590","https://openalex.org/W3200625507","https://openalex.org/W3036013485","https://openalex.org/W3134370868","https://openalex.org/W2808620133","https://openalex.org/W2767873707","https://openalex.org/W2314391035","https://openalex.org/W3009197653","https://openalex.org/W2769139748","https://openalex.org/W2767141265","https://openalex.org/W2764870837"],"abstract_inverted_index":{"As":[0],"the":[1,18,42,56,75,107,131,134,159],"number":[2],"of":[3,77,90,99,133],"user":[4],"equipments":[5],"(UEs)":[6],"with":[7],"various":[8],"data":[9,44],"rate":[10,45],"and":[11,68,126,138,146],"latency":[12],"requirements":[13,33],"increases":[14],"in":[15],"wireless":[16,144],"networks,":[17],"resource":[19],"allocation":[20],"problem":[21,39,59],"for":[22,82],"orthogonal":[23],"frequency-division":[24],"multiple":[25],"access":[26,79],"(OFDMA)":[27],"becomes":[28],"challenging.":[29],"In":[30,51],"particular,":[31],"varying":[32],"lead":[34],"to":[35],"a":[36,70,83],"non-convex":[37,57],"optimization":[38,58],"when":[40],"maximizing":[41],"systems":[43],"while":[46],"preserving":[47],"fairness":[48],"between":[49],"UEs.":[50],"this":[52],"paper,":[53],"we":[54,93],"solve":[55],"using":[60,142],"deep":[61],"reinforcement":[62],"learning":[63],"(DRL).":[64],"We":[65,136,152],"outline,":[66],"train":[67,137],"evaluate":[69,139,147],"DRL":[71],"agent,":[72,92],"which":[73],"performs":[74],"task":[76],"media":[78],"control":[80],"scheduling":[81,100],"downlink":[84],"OFDMA":[85],"scenario.":[86],"To":[87],"kickstart":[88],"training":[89],"our":[91,140,155],"introduce":[94],"mimicking":[95],"learning.":[96],"For":[97],"improvement":[98],"performance,":[101],"full":[102],"buffer":[103],"state":[104],"information":[105],"at":[106],"base":[108],"station":[109],"(e.g.":[110],"packet":[111,113,124],"age,":[112],"size)":[114],"is":[115],"taken":[116],"into":[117],"account.":[118],"Techniques":[119],"like":[120],"input":[121],"feature":[122],"compression,":[123],"shuffling":[125],"age":[127],"capping":[128],"further":[129],"improve":[130],"performance":[132],"agent.":[135],"agents":[141,156],"Nokia&#x0027;s":[143],"suite":[145],"against":[148],"different":[149],"benchmark":[150,160],"agents.":[151,161],"show":[153],"that":[154],"clearly":[157],"outperform":[158]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
