{"id":"https://openalex.org/W4210526511","doi":"https://doi.org/10.1631/fitee.2100331","title":"Multi-agent deep reinforcement learning for end\u2014edge orchestrated resource allocation in industrial wireless networks","display_name":"Multi-agent deep reinforcement learning for end\u2014edge orchestrated resource allocation in industrial wireless networks","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4210526511","doi":"https://doi.org/10.1631/fitee.2100331"},"language":"en","primary_location":{"id":"doi:10.1631/fitee.2100331","is_oa":false,"landing_page_url":"https://doi.org/10.1631/fitee.2100331","pdf_url":null,"source":{"id":"https://openalex.org/S4210189857","display_name":"Frontiers of Information Technology & Electronic Engineering","issn_l":"2095-9184","issn":["2095-9184","2095-9230"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers of Information Technology &amp; Electronic Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067347576","display_name":"Xiaoyu Liu","orcid":"https://orcid.org/0000-0003-3293-0803"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyu Liu","raw_affiliation_strings":["Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100771854","display_name":"Chi Xu","orcid":"https://orcid.org/0000-0001-7389-5763"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chi Xu","raw_affiliation_strings":["Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100383565","display_name":"Haibin Yu","orcid":"https://orcid.org/0000-0002-1663-2956"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haibin Yu","raw_affiliation_strings":["Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005866333","display_name":"Peng Zeng","orcid":"https://orcid.org/0000-0002-3904-9245"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Zeng","raw_affiliation_strings":["Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Networked Control Systems, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100383565","https://openalex.org/A5100771854"],"corresponding_institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"],"apc_list":null,"apc_paid":null,"fwci":1.9338,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.85962004,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"23","issue":"1","first_page":"47","last_page":"60"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11932","display_name":"Wireless Body Area Networks","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8363416194915771},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8043389916419983},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7433862090110779},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6852060556411743},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.6676787734031677},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5904699563980103},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5808995962142944},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.5198845863342285},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4741334915161133},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.4650835394859314},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.459629625082016},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.4191145598888397},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.32710927724838257},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3256487250328064},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.25509947538375854},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.1351240575313568},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08855050802230835}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8363416194915771},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8043389916419983},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7433862090110779},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6852060556411743},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.6676787734031677},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5904699563980103},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5808995962142944},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.5198845863342285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4741334915161133},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.4650835394859314},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.459629625082016},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.4191145598888397},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.32710927724838257},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3256487250328064},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.25509947538375854},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.1351240575313568},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08855050802230835},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1631/fitee.2100331","is_oa":false,"landing_page_url":"https://doi.org/10.1631/fitee.2100331","pdf_url":null,"source":{"id":"https://openalex.org/S4210189857","display_name":"Frontiers of Information Technology & Electronic Engineering","issn_l":"2095-9184","issn":["2095-9184","2095-9230"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers of Information Technology &amp; Electronic Engineering","raw_type":"journal-article"},{"id":"pmh:oai:ir.sia.cn/:173321/30536","is_oa":false,"landing_page_url":"http://ir.sia.cn/handle/173321/30536","pdf_url":null,"source":{"id":"https://openalex.org/S4377196984","display_name":"SIA OpenIR (Chinese Academy of Sciences)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I19820366","host_organization_name":"Chinese Academy of Sciences","host_organization_lineage":["https://openalex.org/I19820366"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"\u671f\u520a\u8bba\u6587"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2775835322","https://openalex.org/W2786904977","https://openalex.org/W2803750062","https://openalex.org/W2806813423","https://openalex.org/W2898652425","https://openalex.org/W2898754723","https://openalex.org/W2915117209","https://openalex.org/W2932097000","https://openalex.org/W2944442327","https://openalex.org/W2949236164","https://openalex.org/W2962912298","https://openalex.org/W3010723141","https://openalex.org/W3011182939","https://openalex.org/W3012434840","https://openalex.org/W3013536937","https://openalex.org/W3015366655","https://openalex.org/W3036631744","https://openalex.org/W3045546031","https://openalex.org/W3047488480","https://openalex.org/W3080425979","https://openalex.org/W3081088023","https://openalex.org/W3082598040","https://openalex.org/W3090914153","https://openalex.org/W3092311181","https://openalex.org/W3093426589","https://openalex.org/W3105883416","https://openalex.org/W3109858579","https://openalex.org/W3176552354","https://openalex.org/W3200230539","https://openalex.org/W4205516653","https://openalex.org/W4210346062","https://openalex.org/W6835070974"],"related_works":["https://openalex.org/W2092530219","https://openalex.org/W2388464034","https://openalex.org/W2533125852","https://openalex.org/W2140460949","https://openalex.org/W2105580438","https://openalex.org/W2057435755","https://openalex.org/W2018782216","https://openalex.org/W187740018","https://openalex.org/W2162286586","https://openalex.org/W4255368532"],"abstract_inverted_index":{"Edge":[0],"artificial":[1],"intelligence":[2],"will":[3],"empower":[4],"the":[5,20,61,78,103,126,134,166,193],"ever":[6],"simple":[7],"industrial":[8],"wireless":[9],"networks":[10],"(IWNs)":[11],"supporting":[12],"complex":[13],"and":[14,22,30,55,94,107,121,147,161,185],"dynamic":[15],"tasks":[16],"by":[17,170],"collaboratively":[18],"exploiting":[19],"computation":[21,119],"communication":[23],"resources":[24],"of":[25,64,92,129,137,168],"both":[26],"machine-type":[27],"devices":[28],"(MTDs)":[29],"edge":[31],"servers.":[32],"In":[33],"this":[34],"paper,":[35],"we":[36,59,76,98,139,152,164],"propose":[37,153],"a":[38,72,84,141,154],"multi-agent":[39],"deep":[40],"reinforcement":[41],"learning":[42,135],"based":[43],"resource":[44,111,189],"allocation":[45,112,190],"(MADRL-RA)":[46],"algorithm":[47],"for":[48],"end-edge":[49],"orchestrated":[50],"IWNs":[51],"to":[52,82,101,116,145,158],"support":[53],"computation-intensive":[54],"delay-sensitive":[56],"applications.":[57],"First,":[58],"present":[60],"system":[62,86,195],"model":[63],"IWNs,":[65],"wherein":[66],"each":[67],"MTD":[68],"is":[69],"regarded":[70],"as":[71],"self-learning":[73],"agent.":[74],"Then,":[75],"apply":[77],"Markov":[79],"decision":[80],"process":[81,136],"formulate":[83],"minimum":[85,194],"overhead":[87],"problem":[88],"with":[89,114,173],"joint":[90],"optimization":[91],"delay":[93],"energy":[95],"consumption.":[96],"Next,":[97],"employ":[99],"MADRL":[100],"defeat":[102],"explosive":[104],"state":[105],"space":[106],"learn":[108],"an":[109,187],"effective":[110,188],"policy":[113,191],"respect":[115],"computing":[117],"decision,":[118],"capacity,":[120],"transmission":[122],"power.":[123],"To":[124],"break":[125],"time":[127],"correlation":[128],"training":[130],"data":[131],"while":[132],"accelerating":[133],"MADRL-RA,":[138],"design":[140],"weighted":[142],"experience":[143],"replay":[144],"store":[146],"sample":[148],"experiences":[149],"categorically.":[150],"Furthermore,":[151],"step-by-step":[155],"\u03b5-greedy":[156],"method":[157],"balance":[159],"exploitation":[160],"exploration.":[162],"Finally,":[163],"verify":[165],"effectiveness":[167],"MADRL-RA":[169,182],"comparing":[171],"it":[172],"some":[174],"benchmark":[175],"algorithms":[176],"in":[177],"many":[178],"experiments,":[179],"showing":[180],"that":[181],"converges":[183],"quickly":[184],"learns":[186],"achieving":[192],"overhead.":[196]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
