{"id":"https://openalex.org/W4412939456","doi":"https://doi.org/10.1109/twc.2025.3592854","title":"Hierarchical Reinforcement Learning-Based Beam Selection for Integrated Sensing and Communication Systems","display_name":"Hierarchical Reinforcement Learning-Based Beam Selection for Integrated Sensing and Communication Systems","publication_year":2025,"publication_date":"2025-08-04","ids":{"openalex":"https://openalex.org/W4412939456","doi":"https://doi.org/10.1109/twc.2025.3592854"},"language":"en","primary_location":{"id":"doi:10.1109/twc.2025.3592854","is_oa":false,"landing_page_url":"https://doi.org/10.1109/twc.2025.3592854","pdf_url":null,"source":{"id":"https://openalex.org/S63459445","display_name":"IEEE Transactions on Wireless Communications","issn_l":"1536-1276","issn":["1536-1276","1558-2248"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Wireless Communications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086024904","display_name":"Ruming Yang","orcid":"https://orcid.org/0000-0001-6119-613X"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ruming Yang","raw_affiliation_strings":["National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-6119-613X","affiliations":[{"raw_affiliation_string":"National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073379430","display_name":"Xingkang Li","orcid":"https://orcid.org/0009-0002-1162-8349"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingkang Li","raw_affiliation_strings":["National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0002-1162-8349","affiliations":[{"raw_affiliation_string":"National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056225611","display_name":"Yongming Huang","orcid":"https://orcid.org/0009-0009-2545-2875"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongming Huang","raw_affiliation_strings":["National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0003-3616-4616","affiliations":[{"raw_affiliation_string":"National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045457613","display_name":"L\u00fcxi Yang","orcid":"https://orcid.org/0000-0003-1474-1806"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Luxi Yang","raw_affiliation_strings":["National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0003-1474-1806","affiliations":[{"raw_affiliation_string":"National Mobile Communications Research Laboratory, School of Information Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Information Science and Engineering, National Mobile Communications Research Laboratory, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100653327","display_name":"Wei Zhang","orcid":"https://orcid.org/0000-0002-1059-3642"},"institutions":[{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]},{"id":"https://openalex.org/I4210155350","display_name":"Purple Mountain Laboratories","ror":"https://ror.org/04zcbk583","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210155350"]}],"countries":["AU","CN"],"is_corresponding":false,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["School of Electrical Engineering and Telecommunications, University of New South Wales, Sydney, NSW, Australia","Purple Mountain Laboratories, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-1059-3642","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Telecommunications, University of New South Wales, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I31746571"]},{"raw_affiliation_string":"Purple Mountain Laboratories, Nanjing, China","institution_ids":["https://openalex.org/I4210155350"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5086024904"],"corresponding_institution_ids":["https://openalex.org/I76569877"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16356747,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"25","issue":null,"first_page":"1767","last_page":"1780"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.9739000201225281,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.9739000201225281,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12879","display_name":"Distributed Sensor Networks and Detection Algorithms","score":0.9685999751091003,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11946","display_name":"Antenna Design and Optimization","score":0.9660000205039978,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7867078185081482},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6996880173683167},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6268385052680969},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4475098252296448},{"id":"https://openalex.org/keywords/beam","display_name":"Beam (structure)","score":0.4258390963077545},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3879181146621704},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.3220560848712921},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11658623814582825}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7867078185081482},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6996880173683167},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6268385052680969},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4475098252296448},{"id":"https://openalex.org/C168834538","wikidata":"https://www.wikidata.org/wiki/Q3705329","display_name":"Beam (structure)","level":2,"score":0.4258390963077545},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3879181146621704},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.3220560848712921},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11658623814582825},{"id":"https://openalex.org/C147176958","wikidata":"https://www.wikidata.org/wiki/Q77590","display_name":"Civil engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/twc.2025.3592854","is_oa":false,"landing_page_url":"https://doi.org/10.1109/twc.2025.3592854","pdf_url":null,"source":{"id":"https://openalex.org/S63459445","display_name":"IEEE Transactions on Wireless Communications","issn_l":"1536-1276","issn":["1536-1276","1558-2248"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Wireless Communications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G178412217","display_name":null,"funder_award_id":"2024YFE0200700","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2374063051","display_name":null,"funder_award_id":"2242022k60002","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G3630466707","display_name":null,"funder_award_id":"U1936201","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8475670238","display_name":null,"funder_award_id":"61971128","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G900479562","display_name":null,"funder_award_id":"62225107","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G986520376","display_name":null,"funder_award_id":"2020YFB1804901","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W2018744547","https://openalex.org/W2083506609","https://openalex.org/W2109910161","https://openalex.org/W2147601077","https://openalex.org/W2579253290","https://openalex.org/W2737761798","https://openalex.org/W2963406768","https://openalex.org/W2964227312","https://openalex.org/W2999272775","https://openalex.org/W3016197022","https://openalex.org/W3037164854","https://openalex.org/W3072033075","https://openalex.org/W3083569984","https://openalex.org/W3118245008","https://openalex.org/W3127867641","https://openalex.org/W3133546437","https://openalex.org/W3136003212","https://openalex.org/W3157573981","https://openalex.org/W3167193327","https://openalex.org/W3168169223","https://openalex.org/W3194620979","https://openalex.org/W3204401797","https://openalex.org/W3211270128","https://openalex.org/W3212590122","https://openalex.org/W4205381552","https://openalex.org/W4206931804","https://openalex.org/W4297964528","https://openalex.org/W4312288512","https://openalex.org/W4317038426","https://openalex.org/W4324116633","https://openalex.org/W4386025671","https://openalex.org/W4386495279","https://openalex.org/W4387870165","https://openalex.org/W4387883605","https://openalex.org/W4388145348","https://openalex.org/W4388430313","https://openalex.org/W4389924236","https://openalex.org/W4390659317","https://openalex.org/W4392908419","https://openalex.org/W4393972738","https://openalex.org/W4396523201"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W2964765435"],"abstract_inverted_index":{"The":[0],"multiple-input":[1],"multiple-output":[2],"dual":[3],"functional":[4],"radar":[5,25],"communication":[6,18,27],"(MIMO-DFRC)":[7],"system":[8,73],"is":[9,32,44,102],"a":[10,33,71,78,84,184,206],"promising":[11,202],"platform":[12],"for":[13,70,97],"future":[14],"integrated":[15],"sensing":[16],"and":[17,26,49,82,99,136,176,190],"applications.":[19],"Ensuring":[20],"reliable":[21],"performance":[22,179],"of":[23,115,133,183,187],"both":[24],"functions,":[28],"the":[29,40,66,109,113,127,134,154,161,168,198,211],"beam":[30,41,67,95,118,173],"selection":[31,42,68,96,174],"critical":[34],"technology":[35],"in":[36,58,108],"MIMO-DFRC":[37,72],"systems.":[38,60],"However,":[39],"problem":[43,69,158],"known":[45],"to":[46,129,152,204],"be":[47],"NP-hard,":[48],"efficiently":[50],"addressing":[51],"it":[52,76],"remains":[53],"an":[54,105,122,147],"open":[55],"issue,":[56],"especially":[57],"distributed":[59],"In":[61,91],"this":[62],"paper,":[63],"we":[64,120,195],"address":[65],"by":[74,104,112,160],"formulating":[75],"as":[77],"semi-Markov":[79],"decision":[80],"process":[81],"propose":[83],"novel":[85],"hierarchical":[86,116,213],"reinforcement":[87],"learning":[88],"(HRL)":[89],"algorithm.":[90],"our":[92],"approach,":[93],"codebook-based":[94],"transmitting":[98],"receiving":[100],"BS":[101],"controlled":[103],"agent":[106,128],"deployed":[107],"cloud.":[110],"Inspired":[111],"mechanism":[114],"codebook":[117,135,214],"training,":[119],"employ":[121],"option-based":[123,162],"policy":[124,209],"that":[125,167,197],"enables":[126],"explore":[130],"different":[131],"layers":[132],"extract":[137],"context":[138],"information":[139],"across":[140],"multiple":[141],"discrete":[142],"time":[143],"steps.":[144],"We":[145],"utilize":[146],"invalid":[148],"action":[149,156],"masking":[150],"technique":[151],"overcome":[153],"dynamic":[155],"space":[157],"caused":[159],"policy.":[163],"Simulation":[164],"results":[165],"demonstrate":[166],"HRL-based":[169],"algorithm":[170,200],"outperforms":[171],"existing":[172],"methods":[175],"achieves":[177],"remarkable":[178],"even":[180],"under":[181],"conditions":[182],"high":[185],"probability":[186],"false":[188],"alarm":[189],"low":[191],"signal-to-noise":[192],"ratio.":[193],"Furthermore,":[194],"find":[196],"proposed":[199],"exhibits":[201],"capabilities":[203],"learn":[205],"more":[207],"efficient":[208],"beyond":[210],"full":[212],"training":[215],"trajectory.":[216]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
