{"id":"https://openalex.org/W3121645716","doi":"https://doi.org/10.1109/globecom42002.2020.9322372","title":"Deep Reinforcement Learning for Robust Beamforming in IRS-assisted Wireless Communications","display_name":"Deep Reinforcement Learning for Robust Beamforming in IRS-assisted Wireless Communications","publication_year":2020,"publication_date":"2020-12-01","ids":{"openalex":"https://openalex.org/W3121645716","doi":"https://doi.org/10.1109/globecom42002.2020.9322372","mag":"3121645716"},"language":"en","primary_location":{"id":"doi:10.1109/globecom42002.2020.9322372","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom42002.2020.9322372","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"GLOBECOM 2020 - 2020 IEEE Global Communications Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059445819","display_name":"Jiaye Lin","orcid":"https://orcid.org/0009-0002-4485-6612"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiaye Lin","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5097023405","display_name":"Yuze Zout","orcid":null},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuze Zout","raw_affiliation_strings":["School of Electronic Information and Communications, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Communications, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052575788","display_name":"Xiaoru Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoru Dong","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042460024","display_name":"Shimin Gong","orcid":"https://orcid.org/0000-0003-4874-8766"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shimin Gong","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007992576","display_name":"Dinh Thai Hoang","orcid":"https://orcid.org/0000-0002-9528-0863"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Dinh Thai Hoang","raw_affiliation_strings":["China School of Electrical and Data Engineering, University of Technology Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"China School of Electrical and Data Engineering, University of Technology Sydney, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091266202","display_name":"Dusit Niyato","orcid":"https://orcid.org/0000-0002-7442-7416"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dusit Niyato","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5059445819"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":3.2878,"has_fulltext":false,"cited_by_count":57,"citation_normalized_percentile":{"value":0.92906773,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11192","display_name":"Underwater Vehicles and Communication Systems","score":0.9778000116348267,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.9621000289916992,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.9230153560638428},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7665441036224365},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6556612253189087},{"id":"https://openalex.org/keywords/telecommunications-link","display_name":"Telecommunications link","score":0.5873228311538696},{"id":"https://openalex.org/keywords/transmitter-power-output","display_name":"Transmitter power output","score":0.5372045040130615},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5365367531776428},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.5180795192718506},{"id":"https://openalex.org/keywords/power-control","display_name":"Power control","score":0.4858510196208954},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.48219552636146545},{"id":"https://openalex.org/keywords/signal-to-noise-ratio","display_name":"Signal-to-noise ratio (imaging)","score":0.42451009154319763},{"id":"https://openalex.org/keywords/convex-optimization","display_name":"Convex optimization","score":0.4235437214374542},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.36530742049217224},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.3035222887992859},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24969643354415894},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23681241273880005},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.19819220900535583},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18028682470321655},{"id":"https://openalex.org/keywords/regular-polygon","display_name":"Regular polygon","score":0.17308419942855835},{"id":"https://openalex.org/keywords/transmitter","display_name":"Transmitter","score":0.11055523157119751}],"concepts":[{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.9230153560638428},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7665441036224365},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6556612253189087},{"id":"https://openalex.org/C138660444","wikidata":"https://www.wikidata.org/wiki/Q5607897","display_name":"Telecommunications link","level":2,"score":0.5873228311538696},{"id":"https://openalex.org/C65422117","wikidata":"https://www.wikidata.org/wiki/Q358527","display_name":"Transmitter power output","level":4,"score":0.5372045040130615},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5365367531776428},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.5180795192718506},{"id":"https://openalex.org/C56685638","wikidata":"https://www.wikidata.org/wiki/Q2300474","display_name":"Power control","level":3,"score":0.4858510196208954},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.48219552636146545},{"id":"https://openalex.org/C13944312","wikidata":"https://www.wikidata.org/wiki/Q7512748","display_name":"Signal-to-noise ratio (imaging)","level":2,"score":0.42451009154319763},{"id":"https://openalex.org/C157972887","wikidata":"https://www.wikidata.org/wiki/Q463359","display_name":"Convex optimization","level":3,"score":0.4235437214374542},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.36530742049217224},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.3035222887992859},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24969643354415894},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23681241273880005},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.19819220900535583},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18028682470321655},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.17308419942855835},{"id":"https://openalex.org/C47798520","wikidata":"https://www.wikidata.org/wiki/Q190157","display_name":"Transmitter","level":3,"score":0.11055523157119751},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/globecom42002.2020.9322372","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globecom42002.2020.9322372","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"GLOBECOM 2020 - 2020 IEEE Global Communications Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3338121238","display_name":null,"funder_award_id":"NRF2017EWT-EP003-041,NRF2015-NRF-ISF001-2277","funder_id":"https://openalex.org/F4320320743","funder_display_name":"Energy Market Authority of Singapore"},{"id":"https://openalex.org/G5607896541","display_name":null,"funder_award_id":"20201269","funder_id":"https://openalex.org/F4320336008","funder_display_name":"National College Students Innovation and Entrepreneurship Training Program"},{"id":"https://openalex.org/G5828897022","display_name":null,"funder_award_id":"M4082187(4080)","funder_id":"https://openalex.org/F4320320766","funder_display_name":"Nanyang Technological University"},{"id":"https://openalex.org/G6812608597","display_name":null,"funder_award_id":"61972434","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7233677137","display_name":null,"funder_award_id":"JCYJ20190807154009444","funder_id":"https://openalex.org/F4320335770","funder_display_name":"Shenzhen Technical Project"},{"id":"https://openalex.org/G937018033","display_name":null,"funder_award_id":"19LGPY292","funder_id":"https://openalex.org/F4320321160","funder_display_name":"Sun Yat-sen University"}],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"},{"id":"https://openalex.org/F4320320743","display_name":"Energy Market Authority of Singapore","ror":"https://ror.org/05tqbd879"},{"id":"https://openalex.org/F4320320766","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321160","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71"},{"id":"https://openalex.org/F4320335770","display_name":"Shenzhen Technical Project","ror":null},{"id":"https://openalex.org/F4320336008","display_name":"National College Students Innovation and Entrepreneurship Training Program","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1996215314","https://openalex.org/W2121863487","https://openalex.org/W2891354184","https://openalex.org/W2898035736","https://openalex.org/W2950077417","https://openalex.org/W2963121727","https://openalex.org/W2963864421","https://openalex.org/W2970670564","https://openalex.org/W3000522337","https://openalex.org/W3001613668","https://openalex.org/W3006762012","https://openalex.org/W3009554119","https://openalex.org/W3009563387","https://openalex.org/W3010384738","https://openalex.org/W3015734880","https://openalex.org/W3018514437","https://openalex.org/W3027118737","https://openalex.org/W3037274483","https://openalex.org/W3045926576","https://openalex.org/W3046938740","https://openalex.org/W3100536113","https://openalex.org/W3103493968","https://openalex.org/W3163796467","https://openalex.org/W3169262754","https://openalex.org/W6684921986","https://openalex.org/W6775995824","https://openalex.org/W6776091530"],"related_works":["https://openalex.org/W3087844490","https://openalex.org/W3090699061","https://openalex.org/W4387546583","https://openalex.org/W2188391530","https://openalex.org/W2055634632","https://openalex.org/W2051762234","https://openalex.org/W2131408743","https://openalex.org/W1510659114","https://openalex.org/W2787827467","https://openalex.org/W2124240980"],"abstract_inverted_index":{"Intelligent":[0],"reflecting":[1],"surface":[2],"(IRS)":[3],"is":[4,107],"a":[5,14,20,32,52,73,95,99,116,132],"promising":[6],"technology":[7],"to":[8,19,46,58,147,178],"assist":[9],"downlink":[10],"information":[11],"transmissions":[12],"from":[13,85],"multi-antenna":[15],"access":[16],"point":[17],"(AP)":[18],"receiver.":[21],"In":[22,125],"this":[23],"paper,":[24],"we":[25,50,93,140],"minimize":[26],"the":[27,36,41,59,66,82,90,103,110,128,135,143,149,153,164,171,179],"AP's":[28,37],"transmit":[29],"power":[30,54,68],"by":[31],"joint":[33],"optimization":[34],"of":[35,134,152],"active":[38,156],"beamforming":[39,83],"and":[40,65,113,174],"IRS's":[42,67],"passive":[43,138],"beamforming.":[44],"Due":[45],"uncertain":[47],"channel":[48],"conditions,":[49],"formulate":[51],"robust":[53,104],"minimization":[55],"problem":[56],"subject":[57],"receiver's":[60],"signal-to-noise":[61],"ratio":[62],"(SNR)":[63],"requirement":[64],"budget":[69],"constraint.":[70],"We":[71],"propose":[72],"deep":[74,119],"reinforcement":[75],"learning":[76,91,172],"(DRL)":[77],"approach":[78],"that":[79,163],"can":[80,141,168],"adapt":[81],"strategies":[84],"past":[86],"experiences.":[87],"To":[88],"improve":[89,169],"performance,":[92],"derive":[94],"convex":[96,145],"approximation":[97,146],"as":[98],"lower":[100],"bound":[101],"on":[102],"problem,":[105],"which":[106],"integrated":[108],"with":[109],"DRL":[111],"framework":[112],"thus":[114],"promoting":[115],"novel":[117],"optimization-driven":[118,165],"deterministic":[120],"policy":[121],"gradient":[122],"(DDPG)":[123],"approach.":[124],"particular,":[126],"when":[127],"DDPG":[129,166,181],"algorithm":[130,167],"generates":[131],"part":[133,151],"action":[136,154],"(e.g.,":[137,155],"beamforming),":[139],"use":[142],"model-based":[144],"optimize":[148],"other":[150],"beamforming)":[157],"efficiently.":[158],"Our":[159],"simulation":[160],"results":[161],"demonstrate":[162],"both":[170],"rate":[173],"reward":[175],"significantly":[176],"compared":[177],"conventional":[180],"algorithm.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
