{"id":"https://openalex.org/W2972841335","doi":"https://doi.org/10.23919/acc.2019.8815077","title":"Block-Decentralized Model-Free Reinforcement Learning Control of Two Time-Scale Networks","display_name":"Block-Decentralized Model-Free Reinforcement Learning Control of Two Time-Scale Networks","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2972841335","doi":"https://doi.org/10.23919/acc.2019.8815077","mag":"2972841335"},"language":"en","primary_location":{"id":"doi:10.23919/acc.2019.8815077","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc.2019.8815077","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 American Control Conference (ACC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101731714","display_name":"Sayak Mukherjee","orcid":"https://orcid.org/0000-0001-8184-4755"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sayak Mukherjee","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA","Department of Electrical and Computer Engineering, North Carolina State University, Raleigh, NC, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055360778","display_name":"Aranya Chakrabortty","orcid":"https://orcid.org/0000-0002-3474-8215"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aranya Chakrabortty","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA","Department of Electrical and Computer Engineering, North Carolina State University, Raleigh, NC, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040513070","display_name":"He Bai","orcid":"https://orcid.org/0000-0002-4247-0698"},"institutions":[{"id":"https://openalex.org/I115475287","display_name":"Oklahoma State University","ror":"https://ror.org/01g9vbr38","country_code":"US","type":"education","lineage":["https://openalex.org/I115475287"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"He Bai","raw_affiliation_strings":["School of Mechanical and Aerospace Engineering, Oklahoma State University, Stillwater, OK, USA"],"affiliations":[{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Oklahoma State University, Stillwater, OK, USA","institution_ids":["https://openalex.org/I115475287"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101731714"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":null,"apc_paid":null,"fwci":2.1995,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.89111566,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2233","last_page":"2238"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11347","display_name":"Neural Networks Stability and Synchronization","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9581000208854675,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8335299491882324},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6304545402526855},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5381008386611938},{"id":"https://openalex.org/keywords/decentralised-system","display_name":"Decentralised system","score":0.47677165269851685},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.47646093368530273},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.46532580256462097},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.4580823481082916},{"id":"https://openalex.org/keywords/perturbation","display_name":"Perturbation (astronomy)","score":0.42112305760383606},{"id":"https://openalex.org/keywords/singular-perturbation","display_name":"Singular perturbation","score":0.41580504179000854},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.24401643872261047},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23254135251045227},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21441355347633362},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.0937495231628418}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8335299491882324},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6304545402526855},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5381008386611938},{"id":"https://openalex.org/C205875254","wikidata":"https://www.wikidata.org/wiki/Q17156857","display_name":"Decentralised system","level":3,"score":0.47677165269851685},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.47646093368530273},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.46532580256462097},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.4580823481082916},{"id":"https://openalex.org/C177918212","wikidata":"https://www.wikidata.org/wiki/Q803623","display_name":"Perturbation (astronomy)","level":2,"score":0.42112305760383606},{"id":"https://openalex.org/C165160513","wikidata":"https://www.wikidata.org/wiki/Q7524249","display_name":"Singular perturbation","level":2,"score":0.41580504179000854},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.24401643872261047},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23254135251045227},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21441355347633362},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0937495231628418},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/acc.2019.8815077","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc.2019.8815077","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 American Control Conference (ACC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W128980932","https://openalex.org/W601351931","https://openalex.org/W1481652330","https://openalex.org/W1515224583","https://openalex.org/W1584101032","https://openalex.org/W1939127652","https://openalex.org/W2005127705","https://openalex.org/W2024303516","https://openalex.org/W2030205386","https://openalex.org/W2037025184","https://openalex.org/W2062361291","https://openalex.org/W2121863487","https://openalex.org/W2148437632","https://openalex.org/W2148439597","https://openalex.org/W2475698787","https://openalex.org/W2476930474","https://openalex.org/W2484646121","https://openalex.org/W2487144912","https://openalex.org/W2564717627","https://openalex.org/W2913981879","https://openalex.org/W4214717370","https://openalex.org/W4234129930","https://openalex.org/W4301886962"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4327639758","https://openalex.org/W2116787190","https://openalex.org/W2154304710","https://openalex.org/W2019676381","https://openalex.org/W2623488306","https://openalex.org/W1971902905","https://openalex.org/W2006371715"],"abstract_inverted_index":{"In":[0],"this":[1,101],"paper,":[2],"we":[3,85],"present":[4],"a":[5,16,139],"cluster-wise":[6],"decentralized":[7,74,102],"model-free":[8],"reinforcement":[9],"learning":[10,103,122],"(RL)":[11],"based":[12],"control":[13,35],"design":[14,33,42,104,119,135],"for":[15,71,78],"linear":[17],"time-invariant":[18],"consensus":[19],"network.":[20],"We":[21,98],"assume":[22],"that":[23,100],"the":[24,28,34,38,49,53,56,60,87,90,110,121,125,134],"fast":[25],"dynamics":[26,51],"of":[27,52,89,127,133],"network":[29],"is":[30,69,112,136],"stable":[31],"and":[32,55,73,93,124],"to":[36],"shape":[37],"slow":[39,50,64],"dynamics.":[40],"The":[41,62,131],"exploits":[43],"timescale":[44],"separation":[45],"properties":[46],"inherent":[47],"in":[48],"clusters":[54],"weak":[57,115],"couplings":[58],"between":[59],"clusters.":[61],"aggregated":[63],"variable":[65],"from":[66],"each":[67,79],"cluster":[68],"used":[70],"feedback":[72],"controllers":[75],"are":[76],"learned":[77,91],"cluster.":[80],"Using":[81],"singular":[82],"perturbation":[83],"theory,":[84],"show":[86],"sub-optimality":[88],"controller":[92],"provide":[94],"closed-loop":[95],"stability":[96],"conditions.":[97],"prove":[99],"will":[105],"produce":[106],"close-to-optimal":[107],"performance":[108],"if":[109],"clustering":[111],"strong":[113],"with":[114],"inter-cluster":[116],"couplings.":[117],"This":[118],"reduces":[120],"time":[123],"amount":[126],"communication":[128],"links":[129],"required.":[130],"effectiveness":[132],"demonstrated":[137],"using":[138],"numerical":[140],"example.":[141]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":2}],"updated_date":"2026-03-03T08:47:05.690250","created_date":"2025-10-10T00:00:00"}
