{"id":"https://openalex.org/W3081631809","doi":"https://doi.org/10.1109/jiot.2020.3021017","title":"Voting-Based Multiagent Reinforcement Learning for Intelligent IoT","display_name":"Voting-Based Multiagent Reinforcement Learning for Intelligent IoT","publication_year":2020,"publication_date":"2020-09-01","ids":{"openalex":"https://openalex.org/W3081631809","doi":"https://doi.org/10.1109/jiot.2020.3021017","mag":"3081631809"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2020.3021017","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2020.3021017","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080546910","display_name":"Yue Xu","orcid":"https://orcid.org/0000-0003-4074-4357"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I4210099586","display_name":"Shenzhen Research Institute of Big Data","ror":"https://ror.org/00z1gwf89","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099586"]},{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yue Xu","raw_affiliation_strings":["Key Laboratory of Universal Wireless Communications, Ministry of Education, Beijing University of Posts and Telecommunications, Beijing, China","Shenzhen Research Institute of Big Data and School of Science and Engineering, Chinese University of Hong Kong, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Universal Wireless Communications, Ministry of Education, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]},{"raw_affiliation_string":"Shenzhen Research Institute of Big Data and School of Science and Engineering, Chinese University of Hong Kong, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924","https://openalex.org/I4210099586"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056090076","display_name":"Zengde Deng","orcid":"https://orcid.org/0000-0001-8286-0255"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zengde Deng","raw_affiliation_strings":["Chinese University of Hong Kong, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Chinese University of Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100707460","display_name":"Mengdi Wang","orcid":"https://orcid.org/0000-0002-2101-9507"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mengdi Wang","raw_affiliation_strings":["Princeton University, Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059494893","display_name":"Wenjun Xu","orcid":"https://orcid.org/0000-0001-8767-4742"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjun Xu","raw_affiliation_strings":["Key Laboratory of Universal Wireless Communications, Ministry of Education, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Universal Wireless Communications, Ministry of Education, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105881332","display_name":"Anthony Man\u2013Cho So","orcid":"https://orcid.org/0000-0003-2588-7851"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Anthony Man-Cho So","raw_affiliation_strings":["Chinese University of Hong Kong, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Chinese University of Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009164482","display_name":"Shuguang Cui","orcid":"https://orcid.org/0000-0003-2608-775X"},"institutions":[{"id":"https://openalex.org/I4210099586","display_name":"Shenzhen Research Institute of Big Data","ror":"https://ror.org/00z1gwf89","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099586"]},{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuguang Cui","raw_affiliation_strings":["Shenzhen Research Institute of Big Data and Future Network of Intelligence Institute, Chinese University of Hong Kong, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Research Institute of Big Data and Future Network of Intelligence Institute, Chinese University of Hong Kong, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924","https://openalex.org/I4210099586"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5080546910"],"corresponding_institution_ids":["https://openalex.org/I139759216","https://openalex.org/I4210099586","https://openalex.org/I4210116924"],"apc_list":null,"apc_paid":null,"fwci":1.7735,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.86151573,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"8","issue":"4","first_page":"2681","last_page":"2693"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8472588062286377},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8384217023849487},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.6667091250419617},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6063448190689087},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.526127815246582},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.4620700478553772},{"id":"https://openalex.org/keywords/internet-of-things","display_name":"Internet of Things","score":0.4361548125743866},{"id":"https://openalex.org/keywords/linear-programming","display_name":"Linear programming","score":0.41556018590927124},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.41399091482162476},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3540988564491272},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.16104480624198914},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.1412504017353058},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07431307435035706}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8472588062286377},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8384217023849487},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.6667091250419617},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6063448190689087},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.526127815246582},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.4620700478553772},{"id":"https://openalex.org/C81860439","wikidata":"https://www.wikidata.org/wiki/Q251212","display_name":"Internet of Things","level":2,"score":0.4361548125743866},{"id":"https://openalex.org/C41045048","wikidata":"https://www.wikidata.org/wiki/Q202843","display_name":"Linear programming","level":2,"score":0.41556018590927124},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.41399091482162476},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3540988564491272},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.16104480624198914},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.1412504017353058},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07431307435035706},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jiot.2020.3021017","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2020.3021017","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8199999928474426,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G2950761795","display_name":null,"funder_award_id":"NSFC- 61771066","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5919707873","display_name":null,"funder_award_id":"2018B030338001","funder_id":"https://openalex.org/F4320336405","funder_display_name":"Special Project for Research and Development in Key areas of Guangdong Province"},{"id":"https://openalex.org/G7106976082","display_name":null,"funder_award_id":"NSFC-61629101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336405","display_name":"Special Project for Research and Development in Key areas of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":89,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W63291521","https://openalex.org/W1488674906","https://openalex.org/W1512919909","https://openalex.org/W1519783625","https://openalex.org/W1540107614","https://openalex.org/W1542941925","https://openalex.org/W2005437559","https://openalex.org/W2098432798","https://openalex.org/W2107544712","https://openalex.org/W2110998393","https://openalex.org/W2118681695","https://openalex.org/W2119567691","https://openalex.org/W2120678009","https://openalex.org/W2121863487","https://openalex.org/W2122701159","https://openalex.org/W2144672231","https://openalex.org/W2148135143","https://openalex.org/W2159941336","https://openalex.org/W2274670401","https://openalex.org/W2289204537","https://openalex.org/W2292533394","https://openalex.org/W2292896113","https://openalex.org/W2395575420","https://openalex.org/W2489939061","https://openalex.org/W2528788999","https://openalex.org/W2553188523","https://openalex.org/W2556370010","https://openalex.org/W2558431499","https://openalex.org/W2567358325","https://openalex.org/W2579592432","https://openalex.org/W2592798481","https://openalex.org/W2594203335","https://openalex.org/W2604873668","https://openalex.org/W2765892966","https://openalex.org/W2766806202","https://openalex.org/W2768629321","https://openalex.org/W2771335004","https://openalex.org/W2772726293","https://openalex.org/W2785315072","https://openalex.org/W2788115019","https://openalex.org/W2886509985","https://openalex.org/W2886567736","https://openalex.org/W2898035736","https://openalex.org/W2905601756","https://openalex.org/W2908261578","https://openalex.org/W2911573951","https://openalex.org/W2922273628","https://openalex.org/W2924948991","https://openalex.org/W2950556355","https://openalex.org/W2951896791","https://openalex.org/W2962691117","https://openalex.org/W2962737466","https://openalex.org/W2962856794","https://openalex.org/W2962990479","https://openalex.org/W2963000099","https://openalex.org/W2963000651","https://openalex.org/W2963028406","https://openalex.org/W2963039558","https://openalex.org/W2963083073","https://openalex.org/W2963325600","https://openalex.org/W2963398524","https://openalex.org/W2963543042","https://openalex.org/W2963615009","https://openalex.org/W2963747324","https://openalex.org/W2964005211","https://openalex.org/W2964170525","https://openalex.org/W2968424451","https://openalex.org/W2968563287","https://openalex.org/W2969195240","https://openalex.org/W2969525674","https://openalex.org/W2997499903","https://openalex.org/W3100707094","https://openalex.org/W3102812201","https://openalex.org/W3106530718","https://openalex.org/W4298023569","https://openalex.org/W6602525666","https://openalex.org/W6631168379","https://openalex.org/W6678494045","https://openalex.org/W6694350876","https://openalex.org/W6712181171","https://openalex.org/W6729964979","https://openalex.org/W6732811253","https://openalex.org/W6734234284","https://openalex.org/W6734678876","https://openalex.org/W6736572398","https://openalex.org/W6747941106","https://openalex.org/W6749032143","https://openalex.org/W6765836026"],"related_works":["https://openalex.org/W4245926026","https://openalex.org/W4311097251","https://openalex.org/W2586548817","https://openalex.org/W2625093826","https://openalex.org/W4306904969","https://openalex.org/W2950174689","https://openalex.org/W4200598720","https://openalex.org/W2921026492","https://openalex.org/W4247463117","https://openalex.org/W2138720691"],"abstract_inverted_index":{"The":[0],"recent":[1],"success":[2],"of":[3,10,17,73,121,132],"single-agent":[4],"reinforcement":[5],"learning":[6,98],"(RL)":[7],"in":[8,28,40,143],"Internet":[9],"Things":[11],"(IoT)":[12],"systems":[13],"motivates":[14],"the":[15,42,50,55,64,69,74,85,96,100,111,119,130],"study":[16],"multiagent":[18,145],"RL":[19],"(MARL),":[20],"which":[21,41,95],"is":[22,52],"more":[23,26],"challenging":[24],"but":[25],"useful":[27],"large-scale":[29],"IoT.":[30],"In":[31,108],"this":[32,60],"article,":[33],"we":[34,62,128],"consider":[35],"a":[36,80,91],"voting-based":[37],"MARL":[38,65],"problem,":[39],"agents":[43],"vote":[44],"to":[45,53,83],"make":[46],"group":[47],"decisions":[48],"and":[49,78,139],"goal":[51],"maximize":[54],"globally":[56],"averaged":[57],"returns.":[58],"To":[59],"end,":[61],"formulate":[63],"problem":[66,77],"based":[67],"on":[68,125],"linear":[70],"programming":[71],"form":[72],"policy":[75],"optimization":[76],"propose":[79,90],"primal-dual":[81],"algorithm":[82,135],"obtain":[84],"optimal":[86],"solution.":[87],"We":[88],"also":[89],"voting":[92],"mechanism":[93],"through":[94],"distributed":[97,112],"achieves":[99],"same":[101],"sublinear":[102],"convergence":[103,131],"rate":[104],"as":[105],"centralized":[106],"learning.":[107],"other":[109],"words,":[110],"decision":[113],"making":[114],"does":[115],"not":[116],"slow":[117],"down":[118],"process":[120],"achieving":[122],"global":[123],"consensus":[124],"optimality.":[126],"Finally,":[127],"verify":[129],"our":[133],"proposed":[134],"with":[136],"numerical":[137],"simulations":[138],"conduct":[140],"case":[141],"studies":[142],"practical":[144],"IoT":[146],"systems.":[147]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":7}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
