{"id":"https://openalex.org/W4205984388","doi":"https://doi.org/10.1109/jstsp.2022.3143488","title":"Joint Beam Training and Data Transmission Control for mmWave Delay-Sensitive Communications: A Parallel Reinforcement Learning Approach","display_name":"Joint Beam Training and Data Transmission Control for mmWave Delay-Sensitive Communications: A Parallel Reinforcement Learning Approach","publication_year":2022,"publication_date":"2022-01-14","ids":{"openalex":"https://openalex.org/W4205984388","doi":"https://doi.org/10.1109/jstsp.2022.3143488"},"language":"en","primary_location":{"id":"doi:10.1109/jstsp.2022.3143488","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2022.3143488","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052823220","display_name":"Wanlu Lei","orcid":"https://orcid.org/0000-0002-9878-3722"},"institutions":[{"id":"https://openalex.org/I1306339040","display_name":"Ericsson (Sweden)","ror":"https://ror.org/05a7rhx54","country_code":"SE","type":"company","lineage":["https://openalex.org/I1306339040"]},{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Wanlu Lei","raw_affiliation_strings":["Ericsson AB, Stockholm, Sweden","Division of Information Science and Engineering, KTH Royal Institute of Technology, Stockholm, Sweden"],"raw_orcid":"https://orcid.org/0000-0002-9878-3722","affiliations":[{"raw_affiliation_string":"Ericsson AB, Stockholm, Sweden","institution_ids":["https://openalex.org/I1306339040"]},{"raw_affiliation_string":"Division of Information Science and Engineering, KTH Royal Institute of Technology, Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090707691","display_name":"Deyou Zhang","orcid":"https://orcid.org/0000-0001-9621-561X"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Deyou Zhang","raw_affiliation_strings":["Division of Information Science and Engineering, KTH Royal Institute of Technology, Stockholm, Sweden"],"raw_orcid":"https://orcid.org/0000-0001-9621-561X","affiliations":[{"raw_affiliation_string":"Division of Information Science and Engineering, KTH Royal Institute of Technology, Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100421130","display_name":"Yu Ye","orcid":"https://orcid.org/0000-0003-4686-0973"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Yu Ye","raw_affiliation_strings":["Division of Information Science and Engineering, KTH Royal Institute of Technology, Stockholm, Sweden"],"raw_orcid":"https://orcid.org/0000-0003-4686-0973","affiliations":[{"raw_affiliation_string":"Division of Information Science and Engineering, KTH Royal Institute of Technology, Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002379058","display_name":"Chenguang Lu","orcid":"https://orcid.org/0000-0001-7798-5416"},"institutions":[{"id":"https://openalex.org/I1306339040","display_name":"Ericsson (Sweden)","ror":"https://ror.org/05a7rhx54","country_code":"SE","type":"company","lineage":["https://openalex.org/I1306339040"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Chenguang Lu","raw_affiliation_strings":["Ericsson Research, Stockholm, Sweden"],"raw_orcid":"https://orcid.org/0000-0001-7798-5416","affiliations":[{"raw_affiliation_string":"Ericsson Research, Stockholm, Sweden","institution_ids":["https://openalex.org/I1306339040"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5052823220"],"corresponding_institution_ids":["https://openalex.org/I1306339040","https://openalex.org/I86987016"],"apc_list":null,"apc_paid":null,"fwci":1.2008,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.771165,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"16","issue":"3","first_page":"447","last_page":"459"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10936","display_name":"Millimeter-Wave Propagation and Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10936","display_name":"Millimeter-Wave Propagation and Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10262","display_name":"Microwave Engineering and Waveguides","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7929725646972656},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7724512219429016},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.747347354888916},{"id":"https://openalex.org/keywords/transmission-delay","display_name":"Transmission delay","score":0.625828742980957},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.6061826944351196},{"id":"https://openalex.org/keywords/lagrange-multiplier","display_name":"Lagrange multiplier","score":0.5537689924240112},{"id":"https://openalex.org/keywords/transmission","display_name":"Transmission (telecommunications)","score":0.5074517130851746},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4834176301956177},{"id":"https://openalex.org/keywords/data-transmission","display_name":"Data transmission","score":0.47732120752334595},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.3995448350906372},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.33939215540885925},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3072279095649719},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.25037527084350586},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.20211821794509888},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1327309012413025},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0966235101222992}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7929725646972656},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7724512219429016},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.747347354888916},{"id":"https://openalex.org/C108921912","wikidata":"https://www.wikidata.org/wiki/Q7834639","display_name":"Transmission delay","level":3,"score":0.625828742980957},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.6061826944351196},{"id":"https://openalex.org/C73684929","wikidata":"https://www.wikidata.org/wiki/Q598870","display_name":"Lagrange multiplier","level":2,"score":0.5537689924240112},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.5074517130851746},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4834176301956177},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.47732120752334595},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3995448350906372},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.33939215540885925},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3072279095649719},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.25037527084350586},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.20211821794509888},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1327309012413025},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0966235101222992},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jstsp.2022.3143488","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2022.3143488","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.9100000262260437,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W948366128","https://openalex.org/W1514588745","https://openalex.org/W1930400786","https://openalex.org/W1941445455","https://openalex.org/W2034651337","https://openalex.org/W2066798397","https://openalex.org/W2104074482","https://openalex.org/W2111953900","https://openalex.org/W2116334496","https://openalex.org/W2123117904","https://openalex.org/W2261663070","https://openalex.org/W2294344867","https://openalex.org/W2604992528","https://openalex.org/W2615358882","https://openalex.org/W2751147412","https://openalex.org/W2799206304","https://openalex.org/W2891787690","https://openalex.org/W2896890603","https://openalex.org/W2947007362","https://openalex.org/W2962691384","https://openalex.org/W2963461637","https://openalex.org/W2963652863","https://openalex.org/W2969788250","https://openalex.org/W2998463968","https://openalex.org/W3016754131","https://openalex.org/W3043521615","https://openalex.org/W3099147043","https://openalex.org/W3108957811","https://openalex.org/W3178091145","https://openalex.org/W4206497039","https://openalex.org/W4288574671","https://openalex.org/W4300773225","https://openalex.org/W6759127422","https://openalex.org/W6774246582"],"related_works":["https://openalex.org/W1600454385","https://openalex.org/W1997033546","https://openalex.org/W2074745806","https://openalex.org/W3120556963","https://openalex.org/W1979241556","https://openalex.org/W2370558260","https://openalex.org/W2157978609","https://openalex.org/W2162286586","https://openalex.org/W4255368532","https://openalex.org/W2568536464"],"abstract_inverted_index":{"Future":[0],"communication":[1],"networks":[2],"call":[3],"for":[4,75],"new":[5],"solutions":[6],"to":[7,50,98],"support":[8],"their":[9],"capacity":[10],"and":[11,53,71,161],"delay":[12,112,162],"demands":[13],"by":[14],"leveraging":[15],"potentials":[16],"of":[17,67,109],"the":[18,25,65,83,100,105,121,147],"millimeter":[19],"wave":[20],"(mmWave)":[21],"frequency":[22],"band.":[23],"However,":[24],"beam":[26,69],"training":[27,70],"procedure":[28],"in":[29,79,138,157],"mmWave":[30,58,76],"systems":[31],"incurs":[32],"significant":[33],"overhead":[34],"as":[35,37,89],"well":[36],"huge":[38],"energy":[39,102,159],"consumption.":[40],"As":[41],"such,":[42],"deriving":[43],"an":[44,125],"adaptive":[45],"control":[46,74],"policy":[47,149],"is":[48,86,129],"beneficial":[49],"both":[51,158],"delay-sensitive":[52,77],"energy-efficient":[54],"data":[55,72],"transmission":[56,73],"over":[57,104],"networks.":[59],"To":[60],"this":[61,80],"end,":[62],"we":[63,119],"investigate":[64],"problem":[66,85],"joint":[68],"communications":[78],"paper.":[81],"Specifically,":[82],"considered":[84,107],"firstly":[87],"formulated":[88],"a":[90,116,133,139],"constrained":[91,122],"Markov":[92],"Decision":[93],"Process":[94],"(MDP),":[95],"which":[96,128],"aims":[97],"minimize":[99],"cumulative":[101],"consumption":[103,160],"whole":[106],"period":[108],"time":[110],"under":[111],"constraint.":[113],"By":[114],"introducing":[115],"Lagrange":[117],"multiplier,":[118],"transform":[120],"MDP":[123],"into":[124],"unconstrained":[126],"one,":[127],"then":[130],"solved":[131],"via":[132,150],"parallel-rollout-based":[134],"reinforcement":[135],"learning":[136],"method":[137],"data-driven":[140],"manner.":[141],"Our":[142],"numerical":[143],"results":[144],"demonstrate":[145],"that":[146],"optimized":[148],"parallel-rollout":[151],"significantly":[152],"outperforms":[153],"other":[154],"baseline":[155],"policies":[156],"performance.":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":6}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
