{"id":"https://openalex.org/W3184866585","doi":"https://doi.org/10.23919/acc50511.2021.9482917","title":"Grid-Interactive Multi-Zone Building Control Using Reinforcement Learning with Global-Local Policy Search","display_name":"Grid-Interactive Multi-Zone Building Control Using Reinforcement Learning with Global-Local Policy Search","publication_year":2021,"publication_date":"2021-05-25","ids":{"openalex":"https://openalex.org/W3184866585","doi":"https://doi.org/10.23919/acc50511.2021.9482917","mag":"3184866585"},"language":"en","primary_location":{"id":"doi:10.23919/acc50511.2021.9482917","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc50511.2021.9482917","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 American Control Conference (ACC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100362472","display_name":"Xiangyu Zhang","orcid":"https://orcid.org/0000-0003-4857-2318"},"institutions":[{"id":"https://openalex.org/I1297288678","display_name":"National Renewable Energy Laboratory","ror":"https://ror.org/036266993","country_code":"US","type":"facility","lineage":["https://openalex.org/I1297288678","https://openalex.org/I1330989302","https://openalex.org/I2800842121"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xiangyu Zhang","raw_affiliation_strings":["U.S. National Renewable Energy Laboratory, Golden, CO, USA"],"affiliations":[{"raw_affiliation_string":"U.S. National Renewable Energy Laboratory, Golden, CO, USA","institution_ids":["https://openalex.org/I1297288678"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045032215","display_name":"Rohit Chintala","orcid":"https://orcid.org/0000-0001-9143-9788"},"institutions":[{"id":"https://openalex.org/I1297288678","display_name":"National Renewable Energy Laboratory","ror":"https://ror.org/036266993","country_code":"US","type":"facility","lineage":["https://openalex.org/I1297288678","https://openalex.org/I1330989302","https://openalex.org/I2800842121"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rohit Chintala","raw_affiliation_strings":["U.S. National Renewable Energy Laboratory, Golden, CO, USA"],"affiliations":[{"raw_affiliation_string":"U.S. National Renewable Energy Laboratory, Golden, CO, USA","institution_ids":["https://openalex.org/I1297288678"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017202620","display_name":"Andrey Bernstein","orcid":"https://orcid.org/0000-0003-4489-8388"},"institutions":[{"id":"https://openalex.org/I1297288678","display_name":"National Renewable Energy Laboratory","ror":"https://ror.org/036266993","country_code":"US","type":"facility","lineage":["https://openalex.org/I1297288678","https://openalex.org/I1330989302","https://openalex.org/I2800842121"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrey Bernstein","raw_affiliation_strings":["U.S. National Renewable Energy Laboratory, Golden, CO, USA"],"affiliations":[{"raw_affiliation_string":"U.S. National Renewable Energy Laboratory, Golden, CO, USA","institution_ids":["https://openalex.org/I1297288678"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008431584","display_name":"Peter Gr\u00e4f","orcid":"https://orcid.org/0000-0003-3150-3404"},"institutions":[{"id":"https://openalex.org/I1297288678","display_name":"National Renewable Energy Laboratory","ror":"https://ror.org/036266993","country_code":"US","type":"facility","lineage":["https://openalex.org/I1297288678","https://openalex.org/I1330989302","https://openalex.org/I2800842121"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peter Graf","raw_affiliation_strings":["U.S. National Renewable Energy Laboratory, Golden, CO, USA"],"affiliations":[{"raw_affiliation_string":"U.S. National Renewable Energy Laboratory, Golden, CO, USA","institution_ids":["https://openalex.org/I1297288678"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070648432","display_name":"Xin Jin","orcid":"https://orcid.org/0000-0001-7746-5955"},"institutions":[{"id":"https://openalex.org/I1297288678","display_name":"National Renewable Energy Laboratory","ror":"https://ror.org/036266993","country_code":"US","type":"facility","lineage":["https://openalex.org/I1297288678","https://openalex.org/I1330989302","https://openalex.org/I2800842121"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Jin","raw_affiliation_strings":["U.S. National Renewable Energy Laboratory, Golden, CO, USA"],"affiliations":[{"raw_affiliation_string":"U.S. National Renewable Energy Laboratory, Golden, CO, USA","institution_ids":["https://openalex.org/I1297288678"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100362472"],"corresponding_institution_ids":["https://openalex.org/I1297288678"],"apc_list":null,"apc_paid":null,"fwci":1.5786,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.81057313,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"4155","last_page":"4162"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8932405710220337},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7446284294128418},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7172113656997681},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.6911743879318237},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.5575143098831177},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.532092273235321},{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.4495658576488495},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.43802186846733093},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3755503296852112},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34998345375061035},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.2833693027496338},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16892346739768982},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10224774479866028},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08743253350257874}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8932405710220337},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7446284294128418},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7172113656997681},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.6911743879318237},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.5575143098831177},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.532092273235321},{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.4495658576488495},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.43802186846733093},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3755503296852112},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34998345375061035},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2833693027496338},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16892346739768982},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10224774479866028},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08743253350257874},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/acc50511.2021.9482917","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc50511.2021.9482917","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 American Control Conference (ACC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.8999999761581421,"id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G1304107674","display_name":null,"funder_award_id":"DE-AC36-08GO28308","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"}],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1973944436","https://openalex.org/W1975817662","https://openalex.org/W2019348145","https://openalex.org/W2108152153","https://openalex.org/W2121863487","https://openalex.org/W2145339207","https://openalex.org/W2171830216","https://openalex.org/W2228052882","https://openalex.org/W2255511049","https://openalex.org/W2596367596","https://openalex.org/W2625874945","https://openalex.org/W2734389517","https://openalex.org/W2736601468","https://openalex.org/W2957897705","https://openalex.org/W3045748774","https://openalex.org/W3048008723","https://openalex.org/W4214717370","https://openalex.org/W6644092405"],"related_works":["https://openalex.org/W1990079087","https://openalex.org/W2101188133","https://openalex.org/W4306904969","https://openalex.org/W3202234113","https://openalex.org/W4248731570","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2768698792"],"abstract_inverted_index":{"In":[0,56,72,86],"this":[1],"paper,":[2],"we":[3],"develop":[4],"a":[5,12,42,50,60,68,76,82,122],"grid-interactive":[6],"multi-zone":[7],"building":[8,24,113],"controller":[9,19,99,118],"based":[10],"on":[11],"deep":[13],"reinforcement":[14],"learning":[15],"(RL)":[16],"approach.":[17],"The":[18],"is":[20,65,79],"designed":[21],"to":[22,88,111],"facilitate":[23],"operation":[25,107],"during":[26,105],"normal":[27],"conditions":[28],"and":[29,37,48,108],"demand":[30],"response":[31],"events,":[32],"while":[33],"ensuring":[34],"occupants":[35],"comfort":[36],"energy":[38],"efficiency.":[39],"We":[40,115],"leverage":[41],"continuous":[43],"action":[44],"space":[45],"RL":[46,53,70,98],"formulation,":[47],"devise":[49],"two-stage":[51],"global-local":[52],"training":[54],"framework.":[55],"the":[57,73,89,96,117],"first":[58],"stage,":[59,75],"global":[61],"fast":[62],"policy":[63,83],"search":[64],"performed":[66],"using":[67,81,121],"gradient-free":[69],"algorithm.":[71],"second":[74],"local":[77],"fine-tuning":[78],"conducted":[80],"gradient":[84],"method.":[85],"contrast":[87],"state-of-the-art":[90],"model":[91],"predictive":[92],"control":[93],"(MPC)":[94],"approach,":[95],"proposed":[97],"does":[100],"not":[101],"require":[102],"complex":[103],"computation":[104],"real-time":[106],"can":[109],"adapt":[110],"nonlinear":[112],"models.":[114],"illustrate":[116],"performance":[119],"numerically":[120],"five-zone":[123],"commercial":[124],"building.":[125]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":2}],"updated_date":"2026-04-18T07:56:08.524223","created_date":"2025-10-10T00:00:00"}
