{"id":"https://openalex.org/W4322730848","doi":"https://doi.org/10.1109/tsusc.2023.3251302","title":"Fast Human-in-the-Loop Control for HVAC Systems via Meta-Learning and Model-Based Offline Reinforcement Learning","display_name":"Fast Human-in-the-Loop Control for HVAC Systems via Meta-Learning and Model-Based Offline Reinforcement Learning","publication_year":2023,"publication_date":"2023-03-01","ids":{"openalex":"https://openalex.org/W4322730848","doi":"https://doi.org/10.1109/tsusc.2023.3251302"},"language":"en","primary_location":{"id":"doi:10.1109/tsusc.2023.3251302","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsusc.2023.3251302","pdf_url":null,"source":{"id":"https://openalex.org/S4210221417","display_name":"IEEE Transactions on Sustainable Computing","issn_l":"2377-3782","issn":["2377-3782","2377-3790"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Sustainable Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100729607","display_name":"Liangliang Chen","orcid":"https://orcid.org/0000-0002-9594-640X"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Liangliang Chen","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004137944","display_name":"Fei Meng","orcid":"https://orcid.org/0000-0001-9225-040X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Fei Meng","raw_affiliation_strings":["Department of Electronic Engineering, Chinese University of Hong Kong, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, Chinese University of Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100386001","display_name":"Ying Zhang","orcid":"https://orcid.org/0000-0001-5246-2141"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ying Zhang","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100729607"],"corresponding_institution_ids":["https://openalex.org/I130701444"],"apc_list":null,"apc_paid":null,"fwci":3.6952,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.92866853,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"8","issue":"3","first_page":"504","last_page":"521"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9585999846458435,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8029505610466003},{"id":"https://openalex.org/keywords/hvac","display_name":"HVAC","score":0.7470510601997375},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.6200647950172424},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5933886170387268},{"id":"https://openalex.org/keywords/human-in-the-loop","display_name":"Human-in-the-loop","score":0.489700585603714},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4761742949485779},{"id":"https://openalex.org/keywords/loop","display_name":"Loop (graph theory)","score":0.4756947457790375},{"id":"https://openalex.org/keywords/meta-learning","display_name":"Meta learning (computer science)","score":0.4711151123046875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3976430296897888},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3377869725227356},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.22365346550941467},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10121196508407593},{"id":"https://openalex.org/keywords/air-conditioning","display_name":"Air conditioning","score":0.06793990731239319},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.06715035438537598}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8029505610466003},{"id":"https://openalex.org/C122346748","wikidata":"https://www.wikidata.org/wiki/Q1798773","display_name":"HVAC","level":3,"score":0.7470510601997375},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.6200647950172424},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5933886170387268},{"id":"https://openalex.org/C2780626000","wikidata":"https://www.wikidata.org/wiki/Q5936775","display_name":"Human-in-the-loop","level":2,"score":0.489700585603714},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4761742949485779},{"id":"https://openalex.org/C184670325","wikidata":"https://www.wikidata.org/wiki/Q512604","display_name":"Loop (graph theory)","level":2,"score":0.4756947457790375},{"id":"https://openalex.org/C2781002164","wikidata":"https://www.wikidata.org/wiki/Q6822311","display_name":"Meta learning (computer science)","level":3,"score":0.4711151123046875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3976430296897888},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3377869725227356},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.22365346550941467},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10121196508407593},{"id":"https://openalex.org/C103742991","wikidata":"https://www.wikidata.org/wiki/Q173725","display_name":"Air conditioning","level":2,"score":0.06793990731239319},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.06715035438537598},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsusc.2023.3251302","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsusc.2023.3251302","pdf_url":null,"source":{"id":"https://openalex.org/S4210221417","display_name":"IEEE Transactions on Sustainable Computing","issn_l":"2377-3782","issn":["2377-3782","2377-3790"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Sustainable Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8799999952316284,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G2844922344","display_name":null,"funder_award_id":"1837021","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"}],"funders":[{"id":"https://openalex.org/F4320335353","display_name":"National Science Foundation of Sri Lanka","ror":"https://ror.org/010xaa060"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W1967188314","https://openalex.org/W1980910761","https://openalex.org/W1983236541","https://openalex.org/W1991652125","https://openalex.org/W2145339207","https://openalex.org/W2166681263","https://openalex.org/W2173089344","https://openalex.org/W2176075926","https://openalex.org/W2490662969","https://openalex.org/W2596990139","https://openalex.org/W2625874945","https://openalex.org/W2736080356","https://openalex.org/W2736601468","https://openalex.org/W2767313115","https://openalex.org/W2798500587","https://openalex.org/W2809095263","https://openalex.org/W2889109362","https://openalex.org/W2897258552","https://openalex.org/W2902907165","https://openalex.org/W2913974632","https://openalex.org/W2936062817","https://openalex.org/W2944345882","https://openalex.org/W2950298232","https://openalex.org/W2957897705","https://openalex.org/W2962872206","https://openalex.org/W2965667459","https://openalex.org/W2979476646","https://openalex.org/W2981246288","https://openalex.org/W2989354373","https://openalex.org/W2999298400","https://openalex.org/W2999477184","https://openalex.org/W3012211643","https://openalex.org/W3022566517","https://openalex.org/W3038822267","https://openalex.org/W3043426275","https://openalex.org/W3112672793","https://openalex.org/W3116620831","https://openalex.org/W3130417286","https://openalex.org/W3134563824","https://openalex.org/W3161051625","https://openalex.org/W3166166623","https://openalex.org/W3186524139","https://openalex.org/W3195761866","https://openalex.org/W4200140111","https://openalex.org/W4206801503","https://openalex.org/W4211049957","https://openalex.org/W4214717370","https://openalex.org/W4225917661","https://openalex.org/W4226494903","https://openalex.org/W4283397781","https://openalex.org/W4293498985","https://openalex.org/W4298132949","https://openalex.org/W4316468403","https://openalex.org/W6638018090","https://openalex.org/W6640174482","https://openalex.org/W6684921986","https://openalex.org/W6695011786","https://openalex.org/W6730042731","https://openalex.org/W6736057607","https://openalex.org/W6736938231","https://openalex.org/W6741002519","https://openalex.org/W6745497480","https://openalex.org/W6747473740","https://openalex.org/W6748839928","https://openalex.org/W6751494529","https://openalex.org/W6751869817","https://openalex.org/W6756852718","https://openalex.org/W6757469721","https://openalex.org/W6760405395","https://openalex.org/W6763005135","https://openalex.org/W6763704811","https://openalex.org/W6764053384","https://openalex.org/W6767334564","https://openalex.org/W6767572230","https://openalex.org/W6772522789","https://openalex.org/W6776026728","https://openalex.org/W6776438516","https://openalex.org/W6777091672","https://openalex.org/W6777656069","https://openalex.org/W6779265984","https://openalex.org/W6782145165","https://openalex.org/W6791413555","https://openalex.org/W6801801719","https://openalex.org/W6810277566","https://openalex.org/W6922480057"],"related_works":["https://openalex.org/W2112866972","https://openalex.org/W4240233711","https://openalex.org/W4367173559","https://openalex.org/W4404795748","https://openalex.org/W4294873804","https://openalex.org/W4404893116","https://openalex.org/W4383109125","https://openalex.org/W2891227010","https://openalex.org/W2918964466","https://openalex.org/W2782058284"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,103],"(RL)":[2],"methods":[3],"can":[4,76,134,231],"be":[5],"used":[6,161],"to":[7,39,79,105,119,162,186,195,204],"develop":[8],"a":[9,63,85,101,177,187,237],"controller":[10],"for":[11,69,182,214],"the":[12,32,45,57,90,121,125,130,136,139,146,150,164,169,192,200,206,211,223,228,247],"heating,":[13],"ventilation,":[14],"and":[15,24,44,141,176,208],"air":[16],"conditioning":[17],"(HVAC)":[18],"systems":[19],"that":[20,227],"both":[21],"saves":[22],"energy":[23],"ensures":[25],"high":[26,91],"occupants\u2019":[27,46,81,92,217],"thermal":[28,48,82,87,94,109,122,152,180,218,234],"comfort":[29,95],"levels.":[30],"However,":[31],"existing":[33],"works":[34],"typically":[35],"require":[36],"on-policy":[37,252],"data":[38,253],"train":[40,106,114],"an":[41,107,115],"RL":[42,67,159,193,249],"agent,":[43],"personalized":[47,70,93,151,233],"preferences":[49,83,235],"are":[50],"not":[51],"considered,":[52],"which":[53],"is":[54,160],"limited":[55],"in":[56,138],"real-world":[58],"scenarios.":[59],"This":[60],"paper":[61],"designs":[62],"high-performance":[64],"model-based":[65,158,248],"offline":[66,147,174],"algorithm":[68,75,104,171,194,213,230,250],"HVAC":[71,166,196],"systems.":[72,197],"The":[73],"proposed":[74,170,229],"quickly":[77],"adapt":[78],"different":[80,216],"with":[84,236,246,251],"few":[86,178],"feedbacks,":[88],"guaranteeing":[89],"levels":[96],"efficiently.":[97],"First,":[98],"we":[99,113],"use":[100,199],"meta-supervised":[102],"occupant's":[108],"preference":[110,153],"model.":[111],"Then,":[112],"ensemble":[116,132],"neural":[117],"network":[118],"predict":[120],"states":[123],"of":[124,191,210,240,243],"considered":[126],"zone.":[127],"In":[128],"addition,":[129],"obtained":[131],"networks":[133],"indicate":[135],"regions":[137],"state":[140],"action":[142],"spaces":[143],"covered":[144],"by":[145],"dataset.":[148],"With":[149],"model":[154],"updated":[155],"via":[156],"meta-testing,":[157],"derive":[163],"optimal":[165],"controller.":[167],"Since":[168],"only":[172],"requires":[173],"datasets":[175],"online":[179],"feedbacks":[181],"training,":[183],"it":[184],"contributes":[185],"more":[188],"practical":[189],"deployment":[190],"We":[198],"ASHRAE":[201],"database":[202],"II":[203],"verify":[205],"effectiveness":[207],"advantage":[209],"meta-learning":[212],"modeling":[215],"preferences.":[219],"Numerical":[220],"simulations":[221],"on":[222],"EnergyPlus":[224],"environment":[225],"demonstrate":[226],"guarantee":[232],"slight":[238],"increase":[239],"power":[241],"consumption":[242],"1.91%":[244],"compared":[245],"aggregation.":[254]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
