{"id":"https://openalex.org/W2885504492","doi":"https://doi.org/10.23919/acc.2018.8431592","title":"Simulation-Based Policy Gradient and Its Building Control Application","display_name":"Simulation-Based Policy Gradient and Its Building Control Application","publication_year":2018,"publication_date":"2018-06-01","ids":{"openalex":"https://openalex.org/W2885504492","doi":"https://doi.org/10.23919/acc.2018.8431592","mag":"2885504492"},"language":"en","primary_location":{"id":"doi:10.23919/acc.2018.8431592","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc.2018.8431592","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Annual American Control Conference (ACC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100654317","display_name":"Donghwan Lee","orcid":"https://orcid.org/0000-0002-4962-8478"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Donghwan Lee","raw_affiliation_strings":["Department of Mechanical Science and Engineering, University of Illinois, Urbana-Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Science and Engineering, University of Illinois, Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100678615","display_name":"Seungjae Lee","orcid":"https://orcid.org/0000-0001-8068-9570"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Seungjae Lee","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017500444","display_name":"Panagiota Karava","orcid":"https://orcid.org/0009-0002-4242-1375"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Panagiota Karava","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035753295","display_name":"Jianghai Hu","orcid":"https://orcid.org/0000-0002-4250-8852"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jianghai Hu","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100654317"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.9418,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.76769971,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"5424","last_page":"5429"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11371","display_name":"Wind and Air Flow Studies","score":0.9793999791145325,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10928","display_name":"Probabilistic and Robust Engineering Design","score":0.9495000243186951,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hvac","display_name":"HVAC","score":0.9340567588806152},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6227920651435852},{"id":"https://openalex.org/keywords/stochastic-control","display_name":"Stochastic control","score":0.5635979771614075},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5292558073997498},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.519846498966217},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.4979369640350342},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.4941706955432892},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.49097350239753723},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4790409803390503},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4478128254413605},{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.43098700046539307},{"id":"https://openalex.org/keywords/gradient-method","display_name":"Gradient method","score":0.4219595491886139},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4204901456832886},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4160844683647156},{"id":"https://openalex.org/keywords/air-conditioning","display_name":"Air conditioning","score":0.41060972213745117},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.21959057450294495},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15984174609184265},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13960200548171997},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.13898396492004395},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.13680565357208252},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.1055167019367218}],"concepts":[{"id":"https://openalex.org/C122346748","wikidata":"https://www.wikidata.org/wiki/Q1798773","display_name":"HVAC","level":3,"score":0.9340567588806152},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6227920651435852},{"id":"https://openalex.org/C170131372","wikidata":"https://www.wikidata.org/wiki/Q7617811","display_name":"Stochastic control","level":3,"score":0.5635979771614075},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5292558073997498},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.519846498966217},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.4979369640350342},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.4941706955432892},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.49097350239753723},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4790409803390503},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4478128254413605},{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.43098700046539307},{"id":"https://openalex.org/C115680565","wikidata":"https://www.wikidata.org/wiki/Q5977448","display_name":"Gradient method","level":2,"score":0.4219595491886139},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4204901456832886},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4160844683647156},{"id":"https://openalex.org/C103742991","wikidata":"https://www.wikidata.org/wiki/Q173725","display_name":"Air conditioning","level":2,"score":0.41060972213745117},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.21959057450294495},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15984174609184265},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13960200548171997},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.13898396492004395},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.13680565357208252},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.1055167019367218},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/acc.2018.8431592","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc.2018.8431592","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Annual American Control Conference (ACC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W55687146","https://openalex.org/W1549086800","https://openalex.org/W1599997802","https://openalex.org/W1839500782","https://openalex.org/W1965842330","https://openalex.org/W1968359621","https://openalex.org/W1968518983","https://openalex.org/W1971761564","https://openalex.org/W1988382136","https://openalex.org/W1991784919","https://openalex.org/W2029264889","https://openalex.org/W2045578358","https://openalex.org/W2053795702","https://openalex.org/W2054888449","https://openalex.org/W2057405764","https://openalex.org/W2079994361","https://openalex.org/W2084260228","https://openalex.org/W2090859261","https://openalex.org/W2093300872","https://openalex.org/W2097148013","https://openalex.org/W2115247028","https://openalex.org/W2121863487","https://openalex.org/W2125612430","https://openalex.org/W2126849655","https://openalex.org/W2139053308","https://openalex.org/W2147242149","https://openalex.org/W2149479912","https://openalex.org/W2155027007","https://openalex.org/W2156835128","https://openalex.org/W2165150801","https://openalex.org/W2166313543","https://openalex.org/W2170990015","https://openalex.org/W2221739275","https://openalex.org/W2241388696","https://openalex.org/W2400109896","https://openalex.org/W2404228993","https://openalex.org/W2591552503","https://openalex.org/W2596990139","https://openalex.org/W2806452171","https://openalex.org/W3139987781","https://openalex.org/W4205326910","https://openalex.org/W4214717370","https://openalex.org/W4302570325","https://openalex.org/W6683204974","https://openalex.org/W6684205842","https://openalex.org/W6690281514","https://openalex.org/W6733612095","https://openalex.org/W6751910157"],"related_works":["https://openalex.org/W2003408565","https://openalex.org/W2996454280","https://openalex.org/W2929211088","https://openalex.org/W4285822430","https://openalex.org/W1996631192","https://openalex.org/W2885504492","https://openalex.org/W3022264972","https://openalex.org/W4319654131","https://openalex.org/W2568720515","https://openalex.org/W3034848451"],"abstract_inverted_index":{"The":[0],"goal":[1],"of":[2,11,42,89,116],"this":[3,43,64],"paper":[4],"is":[5,38,46],"to":[6,78,102],"study":[7,115],"the":[8,39,52,87,90],"potential":[9],"applicability":[10],"a":[12,47,83,97,104,113],"stochastic":[13,49,70],"approximation-based":[14],"policy":[15],"gradient":[16,88,98],"method":[17],"for":[18,68],"optimal":[19,79],"office":[20],"building":[21,32,117],"HVAC":[22,118],"(Heating,":[23],"Ventilation,":[24],"and":[25,95],"Air":[26],"Conditioning)":[27],"control":[28,73,80,106],"systems.":[29,119],"A":[30],"real-world":[31],"thermal":[33],"dynamics":[34],"with":[35],"occupant":[36],"interactions":[37],"main":[40],"focus":[41],"paper.":[44],"It":[45],"complex":[48],"system":[50],"in":[51],"sense":[53],"that":[54],"its":[55,60,110],"statistical":[56],"properties":[57],"depend":[58],"on":[59],"state":[61],"variables.":[62],"In":[63],"case,":[65],"existing":[66],"approaches,":[67],"instance,":[69],"model":[71],"predictive":[72],"methods,":[74],"cannot":[75],"be":[76],"applied":[77],"designs.":[81],"As":[82],"remedy,":[84],"we":[85],"approximate":[86],"cost":[91],"function":[92],"using":[93],"simulations":[94],"use":[96],"descent":[99],"type":[100],"algorithm":[101],"design":[103],"suboptimal":[105],"policy.":[107],"We":[108],"assess":[109],"performance":[111],"through":[112],"simulation":[114]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
