{"id":"https://openalex.org/W3176048614","doi":"https://doi.org/10.1109/jsac.2021.3087248","title":"Effective Communications: A Joint Learning and Communication Framework for Multi-Agent Reinforcement Learning over Noisy Channels","display_name":"Effective Communications: A Joint Learning and Communication Framework for Multi-Agent Reinforcement Learning over Noisy Channels","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3176048614","doi":"https://doi.org/10.1109/jsac.2021.3087248","mag":"3176048614"},"language":"en","primary_location":{"id":"pmh:oai:iris.unimore.it:11380/1280044","is_oa":true,"landing_page_url":"http://hdl.handle.net/11380/1280044","pdf_url":null,"source":{"id":"https://openalex.org/S4377196326","display_name":"Iris Unimore (University of Modena and Reggio Emilia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122346577","host_organization_name":"University of Modena and Reggio Emilia","host_organization_lineage":["https://openalex.org/I122346577"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},"type":"article","indexed_in":[],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/11380/1280044","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064236204","display_name":"Tze-Yang Tung","orcid":"https://orcid.org/0000-0003-2716-5211"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Tung T. -Y.","raw_affiliation_strings":["Information Processing and Communications Laboratory (IPC-Lab), Imperial College London, London, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Information Processing and Communications Laboratory (IPC-Lab), Imperial College London, London, U.K","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035697090","display_name":"Szymon Kobus","orcid":"https://orcid.org/0009-0006-3605-9073"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kobus S.","raw_affiliation_strings":["Information Processing and Communications Laboratory (IPC-Lab), Imperial College London, London, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Information Processing and Communications Laboratory (IPC-Lab), Imperial College London, London, U.K","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023623107","display_name":"Joan S. Pujol Roig","orcid":"https://orcid.org/0000-0001-9209-0207"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Roig J. P.","raw_affiliation_strings":["Samsung Electronics Research and Development Institute UK, Staines-upon-Thames, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Samsung Electronics Research and Development Institute UK, Staines-upon-Thames, U.K","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016883501","display_name":"Den\u0131z G\u00fcnd\u00fcz","orcid":"https://orcid.org/0000-0002-7725-395X"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Gunduz D.","raw_affiliation_strings":["Information Processing and Communications Laboratory (IPC-Lab), Imperial College London, London, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Information Processing and Communications Laboratory (IPC-Lab), Imperial College London, London, U.K","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":10.1077,"has_fulltext":false,"cited_by_count":100,"citation_normalized_percentile":{"value":0.98937087,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11513","display_name":"stochastic dynamics and bifurcation","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11513","display_name":"stochastic dynamics and bifurcation","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8592200875282288},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7865312099456787},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.575177013874054},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.4205389618873596},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3702218532562256},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3457961678504944}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8592200875282288},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7865312099456787},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.575177013874054},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.4205389618873596},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3702218532562256},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3457961678504944},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C170154142","wikidata":"https://www.wikidata.org/wiki/Q150737","display_name":"Architectural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"pmh:oai:iris.unimore.it:11380/1280044","is_oa":true,"landing_page_url":"http://hdl.handle.net/11380/1280044","pdf_url":null,"source":{"id":"https://openalex.org/S4377196326","display_name":"Iris Unimore (University of Modena and Reggio Emilia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122346577","host_organization_name":"University of Modena and Reggio Emilia","host_organization_lineage":["https://openalex.org/I122346577"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:iris.unimore.it:11380/1280044","is_oa":true,"landing_page_url":"http://hdl.handle.net/11380/1280044","pdf_url":null,"source":{"id":"https://openalex.org/S4377196326","display_name":"Iris Unimore (University of Modena and Reggio Emilia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122346577","host_organization_name":"University of Modena and Reggio Emilia","host_organization_lineage":["https://openalex.org/I122346577"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"score":0.4399999976158142,"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17"}],"awards":[{"id":"https://openalex.org/G7846425480","display_name":null,"funder_award_id":"677854","funder_id":"https://openalex.org/F4320334678","funder_display_name":"European Research Council"},{"id":"https://openalex.org/G8105621258","display_name":"Communication-Aware Dynamic Edge Computing (CONNECT)","funder_award_id":"EP/T023600/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2017957151","https://openalex.org/W2050509222","https://openalex.org/W2064675550","https://openalex.org/W2080213916","https://openalex.org/W2081525555","https://openalex.org/W2119717200","https://openalex.org/W2145339207","https://openalex.org/W2150671164","https://openalex.org/W2156737235","https://openalex.org/W2165150801","https://openalex.org/W2173248099","https://openalex.org/W2395575420","https://openalex.org/W2564324149","https://openalex.org/W2666368276","https://openalex.org/W2756196406","https://openalex.org/W2798948906","https://openalex.org/W2803155336","https://openalex.org/W2893836673","https://openalex.org/W2898338514","https://openalex.org/W2902806690","https://openalex.org/W2906647810","https://openalex.org/W2914351253","https://openalex.org/W2946889564","https://openalex.org/W2954559956","https://openalex.org/W2963000099","https://openalex.org/W2963407617","https://openalex.org/W2963588154","https://openalex.org/W2963681240","https://openalex.org/W2963717208","https://openalex.org/W2963864421","https://openalex.org/W2963937357","https://openalex.org/W2964121744","https://openalex.org/W2964198392","https://openalex.org/W2964338167","https://openalex.org/W2968026845","https://openalex.org/W2983400533","https://openalex.org/W2990330051","https://openalex.org/W2993383518","https://openalex.org/W3016715915","https://openalex.org/W3021482604","https://openalex.org/W3024893463","https://openalex.org/W3034611340","https://openalex.org/W3036851434","https://openalex.org/W3044517463","https://openalex.org/W3102125291","https://openalex.org/W3103412725","https://openalex.org/W3120141412","https://openalex.org/W3123911006","https://openalex.org/W3134818623","https://openalex.org/W3180974649","https://openalex.org/W3189491540","https://openalex.org/W4234002534","https://openalex.org/W4289363497","https://openalex.org/W4295846245","https://openalex.org/W4297789683","https://openalex.org/W4299802797","https://openalex.org/W4302570325"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W2964765435"],"abstract_inverted_index":{"We":[0,183],"propose":[1],"a":[2,32,44,53,79,115,133,151,155,212],"novel":[3],"formulation":[4],"of":[5,24,92,95,106,236,243],"the":[6,63,70,93,96,99,107,110,117,140,145,159,170,174,188,193,201,207,233,241],"'effectiveness":[7],"problem'":[8],"in":[9,17,35,43,61,65,169],"communications,":[10],"put":[11],"forth":[12],"by":[13,26],"Shannon":[14],"and":[15,41,98,158,230],"Weaver":[16],"their":[18],"seminal":[19],"work":[20],"'The":[21],"Mathematical":[22],"Theory":[23],"Communication',":[25],"considering":[27],"multiple":[28],"agents":[29,118],"communicating":[30],"over":[31,78,132,154],"noisy":[33,80,84,134,156],"channel":[34,86],"order":[36],"to":[37,67,122,129,149,161,180,198,226],"achieve":[38],"better":[39],"coordination":[40],"cooperation":[42],"multi-agent":[45,54],"reinforcement":[46,238],"learning":[47,239],"(MARL)":[48],"framework.":[49],"Specifically,":[50],"we":[51],"consider":[52],"partially":[55],"observable":[56],"Markov":[57],"decision":[58],"process":[59],"(MA-POMDP),":[60],"which":[62,216],"agents,":[64],"addition":[66],"interacting":[68],"with":[69,75,124],"environment,":[71,97],"can":[72,112],"also":[73,128],"communicate":[74,130],"each":[76,101,125],"other":[77,126],"communication":[81,85,142,176,202,245],"channel.":[82,135],"The":[83],"is":[87,104,148,196,203,211],"considered":[88,204],"explicitly":[89],"as":[90],"part":[91,105],"dynamics":[94],"message":[100,152],"agent":[102,111],"sends":[103],"action":[108],"that":[109,164,187,199],"take.":[113],"As":[114],"result,":[116],"learn":[119],"not":[120],"only":[121],"collaborate":[123],"but":[127],"'effectively'":[131],"This":[136,210],"framework":[137,163,195],"generalizes":[138],"both":[139],"traditional":[141],"problem,":[143],"where":[144,173,200],"main":[146],"goal":[147],"convey":[150],"reliably":[153],"channel,":[157],"'learning":[160],"communicate'":[162],"has":[165,217],"received":[166],"recent":[167],"attention":[168],"MARL":[171],"literature,":[172],"underlying":[175,208],"channels":[177],"are":[178],"assumed":[179],"be":[181],"error-free.":[182],"show":[184],"via":[185],"examples":[186],"joint":[189],"policy":[190],"learned":[191],"using":[192],"proposed":[194],"superior":[197],"separately":[205],"from":[206,222],"MA-POMDP.":[209],"very":[213],"powerful":[214],"framework,":[215],"many":[218],"real":[219],"world":[220],"applications,":[221],"autonomous":[223],"vehicle":[224],"planning":[225],"drone":[227],"swarm":[228],"control,":[229],"opens":[231],"up":[232],"rich":[234],"toolbox":[235],"deep":[237],"for":[240],"design":[242],"multi-user":[244],"systems.":[246]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":20},{"year":2024,"cited_by_count":34},{"year":2023,"cited_by_count":25},{"year":2022,"cited_by_count":16},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-17T06:14:20.161405","created_date":"2021-07-05T00:00:00"}
