{"id":"https://openalex.org/W4379619732","doi":"https://doi.org/10.1109/wocc58016.2023.10139667","title":"Heterogeneous Multi-Agent Reinforcement Learning for Joint Active and Passive Beamforming in IRS Assisted Communications","display_name":"Heterogeneous Multi-Agent Reinforcement Learning for Joint Active and Passive Beamforming in IRS Assisted Communications","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4379619732","doi":"https://doi.org/10.1109/wocc58016.2023.10139667"},"language":"en","primary_location":{"id":"doi:10.1109/wocc58016.2023.10139667","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/wocc58016.2023.10139667","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 32nd Wireless and Optical Communications Conference (WOCC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101411790","display_name":"Ang Gao","orcid":"https://orcid.org/0000-0002-9145-6614"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ang Gao","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102520545","display_name":"Xinshun Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinshun Sun","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108841672","display_name":"Yongshuai Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongshuai Xu","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050892711","display_name":"Wei Liang","orcid":"https://orcid.org/0000-0003-3000-9017"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liang","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University,Xi&#x0027;an,China,710072","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101411790"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04869636,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10069","display_name":"Antenna Design and Analysis","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.9851999878883362,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.7590201497077942},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7573090195655823},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6942801475524902},{"id":"https://openalex.org/keywords/base-station","display_name":"Base station","score":0.6076631546020508},{"id":"https://openalex.org/keywords/interference","display_name":"Interference (communication)","score":0.5609576106071472},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.493113249540329},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.48244816064834595},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.45446979999542236},{"id":"https://openalex.org/keywords/transmitter","display_name":"Transmitter","score":0.4386426508426666},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.43601831793785095},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.318214476108551},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.2123776376247406},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.17084857821464539},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1486022174358368}],"concepts":[{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.7590201497077942},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7573090195655823},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6942801475524902},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.6076631546020508},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.5609576106071472},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.493113249540329},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.48244816064834595},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.45446979999542236},{"id":"https://openalex.org/C47798520","wikidata":"https://www.wikidata.org/wiki/Q190157","display_name":"Transmitter","level":3,"score":0.4386426508426666},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.43601831793785095},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.318214476108551},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.2123776376247406},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.17084857821464539},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1486022174358368},{"id":"https://openalex.org/C170154142","wikidata":"https://www.wikidata.org/wiki/Q150737","display_name":"Architectural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/wocc58016.2023.10139667","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/wocc58016.2023.10139667","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 32nd Wireless and Optical Communications Conference (WOCC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G8165830064","display_name":null,"funder_award_id":"6142414220406","funder_id":"https://openalex.org/F4320327655","funder_display_name":"Foundation of Science and Technology on Information Assurance Laboratory"}],"funders":[{"id":"https://openalex.org/F4320327655","display_name":"Foundation of Science and Technology on Information Assurance Laboratory","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W2891354184","https://openalex.org/W2945534522","https://openalex.org/W2969424089","https://openalex.org/W2978495917","https://openalex.org/W2981792785","https://openalex.org/W2990747873","https://openalex.org/W2995554704","https://openalex.org/W3000577820","https://openalex.org/W3005476696","https://openalex.org/W3010384738","https://openalex.org/W3094619726","https://openalex.org/W4220722339","https://openalex.org/W4285260532","https://openalex.org/W4299802797","https://openalex.org/W4385245566","https://openalex.org/W6738796088","https://openalex.org/W6739901393"],"related_works":["https://openalex.org/W2355663289","https://openalex.org/W2106913410","https://openalex.org/W4380372336","https://openalex.org/W2354248671","https://openalex.org/W2359134391","https://openalex.org/W2947628004","https://openalex.org/W2935229758","https://openalex.org/W2352791832","https://openalex.org/W2387913039","https://openalex.org/W2963170046"],"abstract_inverted_index":{"Ahstract-The":[0],"Intelligent":[1],"Reflecting":[2],"Surface":[3],"(IRS)":[4],"has":[5],"the":[6,10,15,62,123,127,134,142,158,163,169,172,182],"potential":[7],"to":[8,52,61,78,118,126,151],"reconstruct":[9],"electromagnetic":[11],"propagation":[12],"environment,":[13],"paving":[14],"way":[16],"for":[17,28,99],"a":[18,40,43,80,89],"new":[19],"multi-IRS":[20,183],"assisted":[21,184],"communications":[22,185],"paradigm":[23],"that":[24],"beams":[25],"scattered":[26],"signals":[27],"improved":[29],"spectrum":[30],"efficiency":[31],"(SE).":[32],"However,":[33],"accurate":[34],"channel":[35,107],"estimation":[36],"and":[37,56,102,113,121,129,137,144,161,178],"sharing":[38],"becomes":[39,76],"challenge":[41],"when":[42,69],"large":[44],"number":[45],"of":[46,84,132,171],"IRS":[47,164],"elements":[48],"are":[49,72],"involved,":[50],"leading":[51],"extra":[53],"hardware":[54],"complexity":[55],"communication":[57,159],"overhead.":[58],"Moreover,":[59],"due":[60],"cross-interference":[63],"caused":[64],"by":[65],"massive":[66],"reflecting":[67],"paths":[68],"multiple":[70,114],"IRSs":[71,115,138],"introduced,":[73],"SE":[74,120,177],"optimization":[75,105,147],"challenging":[77],"achieve":[79],"close-formed":[81],"solution":[82],"because":[83],"non-convexity.":[85],"This":[86],"paper":[87],"improves":[88],"heterogeneous":[90],"based":[91],"multi-agent":[92],"deep":[93],"deterministic":[94],"policy":[95],"gradient":[96],"(MADDPG)":[97],"approach":[98,174],"joint":[100],"active":[101,143],"passive":[103,145],"beamforming":[104,146],"without":[106,149],"estimation,":[108],"where":[109],"base":[110],"station":[111],"(BS)":[112],"cooperatively":[116],"learn":[117],"enhance":[119],"suppress":[122],"interference.":[124],"Due":[125],"centralized-training":[128],"distributed-execution":[130],"feature":[131],"MADDPG,":[133],"well-trained":[135],"BS":[136],"can":[139,155],"execute":[140],"both":[141],"independently":[148],"referring":[150],"other":[152],"agents,":[153],"which":[154],"greatly":[156],"reduce":[157],"overhead":[160],"simplify":[162],"deployment.":[165],"Numeral":[166],"simulations":[167],"demonstrate":[168],"effectiveness":[170],"proposed":[173],"on":[175],"enhancing":[176],"suppressing":[179],"interference":[180],"in":[181],"system.":[186]},"counts_by_year":[],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
