{"id":"https://openalex.org/W4289713084","doi":"https://doi.org/10.1109/netsoft54395.2022.9844032","title":"On the Training of Reinforcement Learning-based Algorithms in 5G and Beyond Radio Access Networks","display_name":"On the Training of Reinforcement Learning-based Algorithms in 5G and Beyond Radio Access Networks","publication_year":2022,"publication_date":"2022-06-27","ids":{"openalex":"https://openalex.org/W4289713084","doi":"https://doi.org/10.1109/netsoft54395.2022.9844032"},"language":"en","primary_location":{"id":"doi:10.1109/netsoft54395.2022.9844032","is_oa":false,"landing_page_url":"https://doi.org/10.1109/netsoft54395.2022.9844032","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 8th International Conference on Network Softwarization (NetSoft)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063676343","display_name":"Irene Vil\u00e0","orcid":"https://orcid.org/0000-0002-7086-9591"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"I. Vila","raw_affiliation_strings":["Universitat Polit&#x00E8;cnica de Catalunya (UPC),Dept. of Signal Theory and Communications,Barcelona,Spain"],"affiliations":[{"raw_affiliation_string":"Universitat Polit&#x00E8;cnica de Catalunya (UPC),Dept. of Signal Theory and Communications,Barcelona,Spain","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034523211","display_name":"J. P\u00e9rez-Romero","orcid":"https://orcid.org/0000-0001-9131-5013"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"J. Perez-Romero","raw_affiliation_strings":["Universitat Polit&#x00E8;cnica de Catalunya (UPC),Dept. of Signal Theory and Communications,Barcelona,Spain"],"affiliations":[{"raw_affiliation_string":"Universitat Polit&#x00E8;cnica de Catalunya (UPC),Dept. of Signal Theory and Communications,Barcelona,Spain","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048114047","display_name":"O. Sallent","orcid":"https://orcid.org/0000-0002-2114-1406"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"O. Sallent","raw_affiliation_strings":["Universitat Polit&#x00E8;cnica de Catalunya (UPC),Dept. of Signal Theory and Communications,Barcelona,Spain"],"affiliations":[{"raw_affiliation_string":"Universitat Polit&#x00E8;cnica de Catalunya (UPC),Dept. of Signal Theory and Communications,Barcelona,Spain","institution_ids":["https://openalex.org/I9617848"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5063676343"],"corresponding_institution_ids":["https://openalex.org/I9617848"],"apc_list":null,"apc_paid":null,"fwci":0.3684,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.57079851,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"207","last_page":"215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8521100282669067},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7921919822692871},{"id":"https://openalex.org/keywords/retraining","display_name":"Retraining","score":0.5905306339263916},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5868891477584839},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5406996011734009},{"id":"https://openalex.org/keywords/radio-access-network","display_name":"Radio access network","score":0.5315097570419312},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.48588889837265015},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4690568745136261},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.44949787855148315},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.43066734075546265},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.35292166471481323},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.31179550290107727},{"id":"https://openalex.org/keywords/base-station","display_name":"Base station","score":0.13835299015045166},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.12208271026611328}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8521100282669067},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7921919822692871},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.5905306339263916},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5868891477584839},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5406996011734009},{"id":"https://openalex.org/C106365562","wikidata":"https://www.wikidata.org/wiki/Q3078360","display_name":"Radio access network","level":4,"score":0.5315097570419312},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.48588889837265015},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4690568745136261},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.44949787855148315},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.43066734075546265},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.35292166471481323},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.31179550290107727},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.13835299015045166},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.12208271026611328},{"id":"https://openalex.org/C207029474","wikidata":"https://www.wikidata.org/wiki/Q384018","display_name":"Mobile station","level":3,"score":0.0},{"id":"https://openalex.org/C155202549","wikidata":"https://www.wikidata.org/wiki/Q178803","display_name":"International trade","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/netsoft54395.2022.9844032","is_oa":false,"landing_page_url":"https://doi.org/10.1109/netsoft54395.2022.9844032","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 8th International Conference on Network Softwarization (NetSoft)","raw_type":"proceedings-article"},{"id":"pmh:oai:upcommons.upc.edu:2117/380800","is_oa":false,"landing_page_url":"http://hdl.handle.net/2117/380800","pdf_url":null,"source":{"id":"https://openalex.org/S4377196262","display_name":"UPCommons institutional repository (Universitat Polit\u00e8cnica de Catalunya)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9617848","host_organization_name":"Universitat Polit\u00e8cnica de Catalunya","host_organization_lineage":["https://openalex.org/I9617848"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.47999998927116394,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2287583104","https://openalex.org/W2800319120","https://openalex.org/W2807731816","https://openalex.org/W2891171329","https://openalex.org/W2950863887","https://openalex.org/W2951157784","https://openalex.org/W2961380111","https://openalex.org/W2962883549","https://openalex.org/W2968563287","https://openalex.org/W2999146029","https://openalex.org/W3016185400","https://openalex.org/W3017571569","https://openalex.org/W3022566517","https://openalex.org/W3088310808","https://openalex.org/W3098133185","https://openalex.org/W3100707094","https://openalex.org/W3120778962","https://openalex.org/W3184222766","https://openalex.org/W4210979451","https://openalex.org/W4214717370","https://openalex.org/W6677916085","https://openalex.org/W6776438516","https://openalex.org/W6893815513"],"related_works":["https://openalex.org/W2081982437","https://openalex.org/W4394857231","https://openalex.org/W2027050655","https://openalex.org/W3028244590","https://openalex.org/W4254349500","https://openalex.org/W2014369232","https://openalex.org/W3122042562","https://openalex.org/W2050078012","https://openalex.org/W2060761133","https://openalex.org/W2360307734"],"abstract_inverted_index":{"Reinforcement":[0],"Learning":[1],"(RL)-based":[2],"algorithmic":[3],"solutions":[4],"have":[5,26],"been":[6],"profusely":[7],"proposed":[8,118,150],"in":[9,16,63,104,127],"recent":[10],"years":[11],"for":[12,30,59,81,138],"addressing":[13],"multiple":[14],"problems":[15],"the":[17,48,64,71,85,89,92,96,99,105,109,149],"Radio":[18],"Access":[19],"Network":[20],"(RAN).":[21],"However,":[22],"how":[23],"RL":[24,61],"algorithms":[25],"to":[27,94,111],"be":[28],"trained":[29,100],"a":[31,56,113,123,134],"successful":[32],"exploitation":[33],"has":[34],"not":[35],"received":[36],"sufficient":[37],"attention.":[38],"To":[39],"address":[40],"this":[41,53],"limitation,":[42],"which":[43],"is":[44,68,120],"particularly":[45],"relevant":[46,124],"given":[47],"peculiarities":[49],"of":[50,87,98,148],"wireless":[51],"communications,":[52],"paper":[54],"proposes":[55],"functional":[57],"framework":[58,67,119,151],"training":[60,90],"strategies":[62],"RAN.":[65],"The":[66,117],"aligned":[69],"with":[70,122],"O-RAN":[72],"Alliance":[73],"machine":[74],"learning":[75],"workflow":[76],"and":[77,108],"introduces":[78],"specific":[79],"functionalities":[80],"RL,":[82],"such":[83],"as":[84],"way":[86],"specifying":[88],"datasets,":[91],"mechanisms":[93],"monitor":[95],"performance":[97],"policies":[101],"during":[102],"inference":[103],"real":[106],"network,":[107],"capability":[110],"conduct":[112],"retraining":[114],"if":[115],"necessary.":[116],"illustrated":[121],"use":[125],"case":[126],"5G,":[128],"namely":[129],"RAN":[130],"slicing,":[131],"by":[132],"considering":[133],"Deep":[135],"Q-Network":[136],"algorithm":[137],"capacity":[139],"sharing.":[140],"Finally,":[141],"insights":[142],"on":[143],"other":[144],"possible":[145],"applicability":[146],"examples":[147],"are":[152],"provided.":[153]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2022-08-04T00:00:00"}
