{"id":"https://openalex.org/W4401880338","doi":"https://doi.org/10.1109/icps59941.2024.10640003","title":"Online HVAC Optimization under Comfort Constraints via Reinforcement Learning","display_name":"Online HVAC Optimization under Comfort Constraints via Reinforcement Learning","publication_year":2024,"publication_date":"2024-05-12","ids":{"openalex":"https://openalex.org/W4401880338","doi":"https://doi.org/10.1109/icps59941.2024.10640003"},"language":"en","primary_location":{"id":"doi:10.1109/icps59941.2024.10640003","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icps59941.2024.10640003","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 7th International Conference on Industrial Cyber-Physical Systems (ICPS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034063271","display_name":"Christian Stippel","orcid":"https://orcid.org/0000-0003-0482-902X"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":true,"raw_author_name":"Christian Stippel","raw_affiliation_strings":["Institut for Computer Technology,TU Wien,Vienna,Austria"],"affiliations":[{"raw_affiliation_string":"Institut for Computer Technology,TU Wien,Vienna,Austria","institution_ids":["https://openalex.org/I145847075"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093818811","display_name":"Rafael Sterzinger","orcid":"https://orcid.org/0009-0001-0029-8463"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Rafael Sterzinger","raw_affiliation_strings":["Institut for Computer Technology,TU Wien,Vienna,Austria"],"affiliations":[{"raw_affiliation_string":"Institut for Computer Technology,TU Wien,Vienna,Austria","institution_ids":["https://openalex.org/I145847075"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004288654","display_name":"David Sengl","orcid":null},"institutions":[{"id":"https://openalex.org/I121760703","display_name":"University of Applied Sciences Technikum Wien","ror":"https://ror.org/04jsx0x49","country_code":"AT","type":"education","lineage":["https://openalex.org/I121760703"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"David Sengl","raw_affiliation_strings":["Institute Renewable Energy Systems,UAS Technikum Wien,Vienna,Austria"],"affiliations":[{"raw_affiliation_string":"Institute Renewable Energy Systems,UAS Technikum Wien,Vienna,Austria","institution_ids":["https://openalex.org/I121760703"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111434706","display_name":"Aleksey Bratukhin","orcid":null},"institutions":[{"id":"https://openalex.org/I132976966","display_name":"Universit\u00e4t f\u00fcr Weiterbildung Krems","ror":"https://ror.org/03ef4a036","country_code":"AT","type":"education","lineage":["https://openalex.org/I132976966"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Aleksey Bratukhin","raw_affiliation_strings":["University for Continuing Education Krems,Department for Integrated Sensor Systems,Wiener Neustadt,Austria"],"affiliations":[{"raw_affiliation_string":"University for Continuing Education Krems,Department for Integrated Sensor Systems,Wiener Neustadt,Austria","institution_ids":["https://openalex.org/I132976966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077227223","display_name":"Markus D. Kobelrausch","orcid":null},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Markus Kobelrausch","raw_affiliation_strings":["Institut for Computer Technology,TU Wien,Vienna,Austria"],"affiliations":[{"raw_affiliation_string":"Institut for Computer Technology,TU Wien,Vienna,Austria","institution_ids":["https://openalex.org/I145847075"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068463445","display_name":"Stefan Wilker","orcid":"https://orcid.org/0000-0002-9873-0751"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Stefan Wilker","raw_affiliation_strings":["Institut for Computer Technology,TU Wien,Vienna,Austria"],"affiliations":[{"raw_affiliation_string":"Institut for Computer Technology,TU Wien,Vienna,Austria","institution_ids":["https://openalex.org/I145847075"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090568831","display_name":"Thilo Sauter","orcid":"https://orcid.org/0000-0003-1559-8394"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Thilo Sauter","raw_affiliation_strings":["Institut for Computer Technology,TU Wien,Vienna,Austria"],"affiliations":[{"raw_affiliation_string":"Institut for Computer Technology,TU Wien,Vienna,Austria","institution_ids":["https://openalex.org/I145847075"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5034063271"],"corresponding_institution_ids":["https://openalex.org/I145847075"],"apc_list":null,"apc_paid":null,"fwci":1.115,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.76064232,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.9706000089645386,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hvac","display_name":"HVAC","score":0.7891761064529419},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7808965444564819},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6411160826683044},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.607742965221405},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3225330710411072},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2113494575023651},{"id":"https://openalex.org/keywords/air-conditioning","display_name":"Air conditioning","score":0.14072668552398682},{"id":"https://openalex.org/keywords/mechanical-engineering","display_name":"Mechanical engineering","score":0.07660049200057983},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.07323923707008362}],"concepts":[{"id":"https://openalex.org/C122346748","wikidata":"https://www.wikidata.org/wiki/Q1798773","display_name":"HVAC","level":3,"score":0.7891761064529419},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7808965444564819},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6411160826683044},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.607742965221405},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3225330710411072},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2113494575023651},{"id":"https://openalex.org/C103742991","wikidata":"https://www.wikidata.org/wiki/Q173725","display_name":"Air conditioning","level":2,"score":0.14072668552398682},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.07660049200057983},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.07323923707008362}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icps59941.2024.10640003","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icps59941.2024.10640003","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 7th International Conference on Industrial Cyber-Physical Systems (ICPS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320310617","display_name":"Klima- und Energiefonds","ror":"https://ror.org/044ym4p17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2103914933","https://openalex.org/W2736601468","https://openalex.org/W2902257695","https://openalex.org/W2924196570","https://openalex.org/W2946189104","https://openalex.org/W3013294057","https://openalex.org/W3023669592","https://openalex.org/W3037631072","https://openalex.org/W3103997657","https://openalex.org/W3123856535","https://openalex.org/W3166166623","https://openalex.org/W4220894590","https://openalex.org/W4225157558","https://openalex.org/W4241894848","https://openalex.org/W4293217028","https://openalex.org/W4387025761","https://openalex.org/W6692846177","https://openalex.org/W6741002519"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2112866972","https://openalex.org/W4240233711","https://openalex.org/W2900606913","https://openalex.org/W4320003279","https://openalex.org/W2326910963","https://openalex.org/W3111008797","https://openalex.org/W4287552621","https://openalex.org/W4376649626"],"abstract_inverted_index":{"This":[0],"paper":[1],"shows":[2],"the":[3,10,25,41,105,144],"capabilities":[4],"of":[5,12,28,70,116,180],"Reinforcement":[6],"Learning":[7],"to":[8,39,104,141,166],"enhance":[9],"efficiency":[11],"heating,":[13],"ventilation,":[14],"and":[15,30,35,49,64,86,127,134,178],"air":[16,50],"conditioning":[17],"systems":[18],"within":[19],"office":[20],"buildings.":[21],"Our":[22],"research":[23,72,118],"applies":[24],"precise":[26],"management":[27],"temperature":[29,87],"humidity,":[31],"fundamental":[32],"control":[33,57,108,130,156],"algorithms,":[34],"several":[36],"other":[37],"factors":[38],"reduce":[40],"building\u2019s":[42],"power":[43],"consumption":[44,96],"while":[45,89],"improving":[46],"thermal":[47],"comfort":[48],"quality.":[51],"We":[52,149],"succeed":[53],"in":[54,82,94,111],"developing":[55],"optimal":[56],"policies":[58],"by":[59,97],"employing":[60],"Proximal":[61],"Policy":[62],"Optimization":[63],"Advantage":[65],"Actor":[66],"Critic.":[67],"The":[68,114],"outcomes":[69],"our":[71,75,117,151,181],"indicate":[73],"that":[74,174],"RL":[76,121],"framework":[77],"substantially":[78],"outperforms":[79],"existing":[80],"baselines":[81],"maintaining":[83],"ideal":[84],"humidity":[85],"levels":[88],"achieving":[90],"a":[91,161,171],"notable":[92],"reduction":[93],"energy":[95],"$12":[98],"\\%$":[99],"over":[100],"seven":[101],"years":[102],"compared":[103],"current":[106],"static":[107],"logic":[109],"employed":[110],"HVAC":[112,129],"systems.":[113],"contributions":[115],"include":[119],"introducing":[120],"agents":[122],"trained":[123],"online":[124],"for":[125],"effective":[126],"economical":[128],"from":[131],"day":[132],"one":[133],"an":[135],"underlying":[136],"shared":[137],"state":[138],"embedding":[139],"space":[140],"effectively":[142],"understand":[143],"dynamics":[145],"between":[146],"various":[147],"rooms.":[148],"compare":[150],"approach":[152],"against":[153],"four":[154],"baseline":[155],"logics.":[157],"Moreover,":[158],"we":[159],"show":[160],"novel":[162],"socket":[163],"communication":[164],"protocol":[165],"seamlessly":[167],"interact":[168],"with":[169],"TRNSYS18,":[170],"simulation":[172],"environment":[173],"enables":[175],"rapid":[176],"training":[177],"evaluation":[179],"agents.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
