{"id":"https://openalex.org/W4417201783","doi":"https://doi.org/10.1109/tcomm.2025.3642701","title":"Fast Reinforcement Learning for Robust Beam Codebooks in Future Communication Systems","display_name":"Fast Reinforcement Learning for Robust Beam Codebooks in Future Communication Systems","publication_year":2025,"publication_date":"2025-12-10","ids":{"openalex":"https://openalex.org/W4417201783","doi":"https://doi.org/10.1109/tcomm.2025.3642701"},"language":null,"primary_location":{"id":"doi:10.1109/tcomm.2025.3642701","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcomm.2025.3642701","pdf_url":null,"source":{"id":"https://openalex.org/S196647941","display_name":"IEEE Transactions on Communications","issn_l":"0090-6778","issn":["0090-6778","1558-0857"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310316002","host_organization_name":"IEEE Communications Society","host_organization_lineage":["https://openalex.org/P4310316002","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Communications Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Communications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1109/tcomm.2025.3642701","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033586394","display_name":"Anouar Nechi","orcid":"https://orcid.org/0000-0001-9680-6145"},"institutions":[{"id":"https://openalex.org/I2799978770","display_name":"X-Fab (Germany)","ror":"https://ror.org/030bh9196","country_code":"DE","type":"company","lineage":["https://openalex.org/I2799978770"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Anouar Nechi","raw_affiliation_strings":["Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","institution_ids":["https://openalex.org/I2799978770"]},{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120743640","display_name":"Zakaria Narjis","orcid":"https://orcid.org/0009-0007-7033-4419"},"institutions":[{"id":"https://openalex.org/I2799978770","display_name":"X-Fab (Germany)","ror":"https://ror.org/030bh9196","country_code":"DE","type":"company","lineage":["https://openalex.org/I2799978770"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Zakaria Narjis","raw_affiliation_strings":["Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","institution_ids":["https://openalex.org/I2799978770"]},{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070129711","display_name":"Rainer Buchty","orcid":"https://orcid.org/0009-0004-9413-2078"},"institutions":[{"id":"https://openalex.org/I2799978770","display_name":"X-Fab (Germany)","ror":"https://ror.org/030bh9196","country_code":"DE","type":"company","lineage":["https://openalex.org/I2799978770"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rainer Buchty","raw_affiliation_strings":["Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","institution_ids":["https://openalex.org/I2799978770"]},{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039777488","display_name":"Mladen Berekovi\u0107","orcid":"https://orcid.org/0000-0003-1911-756X"},"institutions":[{"id":"https://openalex.org/I2799978770","display_name":"X-Fab (Germany)","ror":"https://ror.org/030bh9196","country_code":"DE","type":"company","lineage":["https://openalex.org/I2799978770"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Mladen Berekovic","raw_affiliation_strings":["Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","institution_ids":["https://openalex.org/I2799978770"]},{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024325751","display_name":"Saleh Mulhem","orcid":"https://orcid.org/0000-0001-7380-5270"},"institutions":[{"id":"https://openalex.org/I2799978770","display_name":"X-Fab (Germany)","ror":"https://ror.org/030bh9196","country_code":"DE","type":"company","lineage":["https://openalex.org/I2799978770"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Saleh Mulhem","raw_affiliation_strings":["Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, L&#x00FC;beck, Schleswig-Holstein, Germany","institution_ids":["https://openalex.org/I2799978770"]},{"raw_affiliation_string":"Institute of Computer Engineering, Universit&#x00E4;t zu L&#x00FC;beck, Germany","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5033586394"],"corresponding_institution_ids":["https://openalex.org/I2799978770"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38893477,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"74","issue":null,"first_page":"1967","last_page":"1983"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10936","display_name":"Millimeter-Wave Propagation and Modeling","score":0.978600025177002,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10936","display_name":"Millimeter-Wave Propagation and Modeling","score":0.978600025177002,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.0142000000923872,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":0.002400000113993883,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codebook","display_name":"Codebook","score":0.9128000140190125},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8116000294685364},{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.7261000275611877},{"id":"https://openalex.org/keywords/mimo","display_name":"MIMO","score":0.5907999873161316},{"id":"https://openalex.org/keywords/communications-system","display_name":"Communications system","score":0.5019999742507935},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4433000087738037},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.36160001158714294},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.34450000524520874}],"concepts":[{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.9128000140190125},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8116000294685364},{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.7261000275611877},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6747999787330627},{"id":"https://openalex.org/C207987634","wikidata":"https://www.wikidata.org/wiki/Q176862","display_name":"MIMO","level":3,"score":0.5907999873161316},{"id":"https://openalex.org/C101765175","wikidata":"https://www.wikidata.org/wiki/Q577764","display_name":"Communications system","level":2,"score":0.5019999742507935},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4433000087738037},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.41830000281333923},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.36160001158714294},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3571000099182129},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.34450000524520874},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.3271999955177307},{"id":"https://openalex.org/C168834538","wikidata":"https://www.wikidata.org/wiki/Q3705329","display_name":"Beam (structure)","level":2,"score":0.32190001010894775},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.31940001249313354},{"id":"https://openalex.org/C45764600","wikidata":"https://www.wikidata.org/wiki/Q570342","display_name":"Extremely high frequency","level":2,"score":0.30169999599456787},{"id":"https://openalex.org/C40409654","wikidata":"https://www.wikidata.org/wiki/Q375889","display_name":"Orthogonal frequency-division multiplexing","level":3,"score":0.28679999709129333},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C138660444","wikidata":"https://www.wikidata.org/wiki/Q5607897","display_name":"Telecommunications link","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C89061704","wikidata":"https://www.wikidata.org/wiki/Q5555726","display_name":"Frequency-division multiplexing","level":4,"score":0.2750999927520752},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2685000002384186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.267300009727478},{"id":"https://openalex.org/C2781327853","wikidata":"https://www.wikidata.org/wiki/Q3552547","display_name":"User equipment","level":3,"score":0.26269999146461487},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2596000134944916},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.25920000672340393},{"id":"https://openalex.org/C154910267","wikidata":"https://www.wikidata.org/wiki/Q1740982","display_name":"Non-line-of-sight propagation","level":3,"score":0.25780001282691956},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.25290000438690186}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcomm.2025.3642701","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcomm.2025.3642701","pdf_url":null,"source":{"id":"https://openalex.org/S196647941","display_name":"IEEE Transactions on Communications","issn_l":"0090-6778","issn":["0090-6778","1558-0857"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310316002","host_organization_name":"IEEE Communications Society","host_organization_lineage":["https://openalex.org/P4310316002","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Communications Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Communications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/tcomm.2025.3642701","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcomm.2025.3642701","pdf_url":null,"source":{"id":"https://openalex.org/S196647941","display_name":"IEEE Transactions on Communications","issn_l":"0090-6778","issn":["0090-6778","1558-0857"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310316002","host_organization_name":"IEEE Communications Society","host_organization_lineage":["https://openalex.org/P4310316002","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Communications Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Communications","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8178873707","display_name":null,"funder_award_id":"403579441","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1956027752","https://openalex.org/W1974598214","https://openalex.org/W2034651337","https://openalex.org/W2074863717","https://openalex.org/W2075148031","https://openalex.org/W2111953900","https://openalex.org/W2134383396","https://openalex.org/W2166486216","https://openalex.org/W2167319728","https://openalex.org/W2195693430","https://openalex.org/W2222512263","https://openalex.org/W2261663070","https://openalex.org/W2567050201","https://openalex.org/W2929985644","https://openalex.org/W2958261239","https://openalex.org/W2991478545","https://openalex.org/W3037339607","https://openalex.org/W3046928693","https://openalex.org/W3169551415","https://openalex.org/W3212407382","https://openalex.org/W4225663377","https://openalex.org/W4226227715","https://openalex.org/W4255949318","https://openalex.org/W4310174457","https://openalex.org/W4387880310","https://openalex.org/W4390576588"],"related_works":[],"abstract_inverted_index":{"Millimeter":[0],"wave":[1],"(mmWave)":[2],"and":[3,17,33,67,93,124,161,167,174],"terahertz":[4],"(THz)":[5],"MIMO":[6],"systems":[7,134],"typically":[8],"rely":[9],"on":[10],"predefined":[11],"beamforming":[12,159],"codebooks":[13,22],"for":[14,26,41,103,127],"initial":[15],"access":[16],"data":[18],"transmission.":[19],"However,":[20],"these":[21],"are":[23],"often":[24],"unoptimized":[25],"specific":[27],"conditions,":[28,176],"leading":[29],"to":[30,62,165],"large":[31],"sizes":[32],"significant":[34],"beam":[35,54,129],"training":[36],"overhead,":[37],"thereby":[38],"complicating":[39],"support":[40],"highly":[42],"mobile":[43],"applications.":[44],"This":[45,139],"paper":[46,140],"introduces":[47],"a":[48,105,114],"reinforcement":[49,78,98],"learning":[50,79,99],"framework":[51,75],"that":[52],"optimizes":[53],"patterns":[55],"using":[56],"only":[57],"receive":[58],"power":[59],"measurements,":[60],"adapting":[61],"the":[63,142,151,154],"environment,":[64],"user":[65],"distribution,":[66],"hardware":[68,125,179],"constraints":[69],"without":[70],"prior":[71],"channel":[72],"knowledge.":[73],"The":[74],"explores":[76],"three":[77],"algorithms:":[80],"Deep":[81,88],"Deterministic":[82,89],"Policy":[83,90],"Gradient":[84,91],"(DDPG),":[85],"Twin":[86],"Delayed":[87],"(TD3),":[92],"Soft":[94],"Actor-Critic":[95],"(SAC).":[96],"While":[97],"has":[100,135],"shown":[101],"promise":[102],"beamforming,":[104],"comprehensive":[106],"comparative":[107,146],"analysis":[108],"of":[109,116,153],"advanced":[110],"RL":[111],"algorithms":[112],"under":[113],"combination":[115],"realistic":[117],"challenges,":[118],"such":[119,144],"as":[120],"Non-Line-of-Sight":[121],"(NLoS)":[122],"conditions":[123],"impairments":[126],"adaptive":[128],"codebook":[130],"design":[131],"in":[132,169],"mmWave/THz":[133],"been":[136],"largely":[137],"unexplored.":[138],"presents":[141],"first":[143],"in-depth":[145],"study.":[147],"Simulation":[148],"results":[149],"demonstrate":[150],"superiority":[152],"SAC":[155],"algorithm,":[156],"achieving":[157],"higher":[158],"gain":[160],"faster":[162],"convergence":[163],"compared":[164],"DDPG":[166],"TD3":[168],"various":[170],"scenarios,":[171],"including":[172],"LoS":[173],"NLoS":[175],"even":[177],"with":[178],"impairments.":[180]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-12-10T00:00:00"}
