{"id":"https://openalex.org/W4388327811","doi":"https://doi.org/10.1145/3600100.3626270","title":"Physics-informed model-based reinforcement learning (PI-MBRL) to control building heating systems in low training data regimes","display_name":"Physics-informed model-based reinforcement learning (PI-MBRL) to control building heating systems in low training data regimes","publication_year":2023,"publication_date":"2023-11-03","ids":{"openalex":"https://openalex.org/W4388327811","doi":"https://doi.org/10.1145/3600100.3626270"},"language":"en","primary_location":{"id":"doi:10.1145/3600100.3626270","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3600100.3626270","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th ACM International Conference on Systems for Energy-Efficient Buildings, Cities, and Transportation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://lirias.kuleuven.be/retrieve/69327276-8f48-4372-b512-a90b5ef465d8","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059466422","display_name":"Muhammad Hafeez Saeed","orcid":"https://orcid.org/0000-0003-4688-6049"},"institutions":[{"id":"https://openalex.org/I89206478","display_name":"Engie (Belgium)","ror":"https://ror.org/00c97z041","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210124897","https://openalex.org/I89206478"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Muhammad Hafeez Saeed","raw_affiliation_strings":["ELECTA, KU Leuven, Belgium and \rEnergyVille, Belgium"],"affiliations":[{"raw_affiliation_string":"ELECTA, KU Leuven, Belgium and \rEnergyVille, Belgium","institution_ids":["https://openalex.org/I89206478","https://openalex.org/I99464096"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089050773","display_name":"Hussain Kazmi","orcid":"https://orcid.org/0000-0002-7765-8068"},"institutions":[{"id":"https://openalex.org/I89206478","display_name":"Engie (Belgium)","ror":"https://ror.org/00c97z041","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210124897","https://openalex.org/I89206478"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Hussain Kazmi","raw_affiliation_strings":["ELECTA, KU Leuven, Belgium and \rEnergyVille, Belgium"],"affiliations":[{"raw_affiliation_string":"ELECTA, KU Leuven, Belgium and \rEnergyVille, Belgium","institution_ids":["https://openalex.org/I89206478","https://openalex.org/I99464096"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024462942","display_name":"Geert Deconinck","orcid":"https://orcid.org/0000-0002-2225-3987"},"institutions":[{"id":"https://openalex.org/I89206478","display_name":"Engie (Belgium)","ror":"https://ror.org/00c97z041","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210124897","https://openalex.org/I89206478"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Geert Deconinck","raw_affiliation_strings":["ELECTA, KU Leuven, Belgium and \rEnergyVille, Belgium"],"affiliations":[{"raw_affiliation_string":"ELECTA, KU Leuven, Belgium and \rEnergyVille, Belgium","institution_ids":["https://openalex.org/I89206478","https://openalex.org/I99464096"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059466422"],"corresponding_institution_ids":["https://openalex.org/I89206478","https://openalex.org/I99464096"],"apc_list":null,"apc_paid":null,"fwci":0.1529,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.48949551,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"300","last_page":"302"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10121","display_name":"Building Energy and Comfort Optimization","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10998","display_name":"Heat Transfer and Optimization","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9783999919891357,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8930946588516235},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5881687998771667},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5678623914718628},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5629945993423462},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5594040155410767},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5572051405906677},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.492497056722641},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.47884321212768555},{"id":"https://openalex.org/keywords/physical-system","display_name":"Physical system","score":0.42897751927375793},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.4160388112068176},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14885550737380981},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12502068281173706},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.12193763256072998},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11495694518089294}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8930946588516235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5881687998771667},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5678623914718628},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5629945993423462},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5594040155410767},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5572051405906677},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.492497056722641},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47884321212768555},{"id":"https://openalex.org/C116672817","wikidata":"https://www.wikidata.org/wiki/Q1454986","display_name":"Physical system","level":2,"score":0.42897751927375793},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.4160388112068176},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14885550737380981},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12502068281173706},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.12193763256072998},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11495694518089294},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3600100.3626270","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3600100.3626270","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th ACM International Conference on Systems for Energy-Efficient Buildings, Cities, and Transportation","raw_type":"proceedings-article"},{"id":"pmh:oai:lirias2repo.kuleuven.be:20.500.12942/738232","is_oa":true,"landing_page_url":"https://lirias.kuleuven.be/handle/20.500.12942/738232","pdf_url":"https://lirias.kuleuven.be/retrieve/69327276-8f48-4372-b512-a90b5ef465d8","source":{"id":"https://openalex.org/S4306401954","display_name":"Lirias (KU Leuven)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I99464096","host_organization_name":"KU Leuven","host_organization_lineage":["https://openalex.org/I99464096"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"10th ACM International Conference on Systems for Energy-Efficient Buildings, Cities, and Transportation (BuildSys), TURKEY, Istanbul, 15-16 November 2023","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:lirias2repo.kuleuven.be:20.500.12942/738232","is_oa":true,"landing_page_url":"https://lirias.kuleuven.be/handle/20.500.12942/738232","pdf_url":"https://lirias.kuleuven.be/retrieve/69327276-8f48-4372-b512-a90b5ef465d8","source":{"id":"https://openalex.org/S4306401954","display_name":"Lirias (KU Leuven)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I99464096","host_organization_name":"KU Leuven","host_organization_lineage":["https://openalex.org/I99464096"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"10th ACM International Conference on Systems for Energy-Efficient Buildings, Cities, and Transportation (BuildSys), TURKEY, Istanbul, 15-16 November 2023","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6772383909","display_name":null,"funder_award_id":"C24M/21/021","funder_id":"https://openalex.org/F4320322308","funder_display_name":"KU Leuven"},{"id":"https://openalex.org/G8764632332","display_name":null,"funder_award_id":"C24M/21/021","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"}],"funders":[{"id":"https://openalex.org/F4320321730","display_name":"Fonds Wetenschappelijk Onderzoek","ror":"https://ror.org/03qtxy027"},{"id":"https://openalex.org/F4320322308","display_name":"KU Leuven","ror":"https://ror.org/05f950310"},{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388327811.pdf","grobid_xml":"https://content.openalex.org/works/W4388327811.grobid-xml"},"referenced_works_count":6,"referenced_works":["https://openalex.org/W1491843047","https://openalex.org/W3119776855","https://openalex.org/W3163993681","https://openalex.org/W3209188603","https://openalex.org/W4298857966","https://openalex.org/W4378571872"],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2106552856","https://openalex.org/W2089013912","https://openalex.org/W2107890255","https://openalex.org/W2076061571","https://openalex.org/W1987513656","https://openalex.org/W2145821588"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,8,74,105],"(RL)":[2],"is":[3,51,61],"a":[4,85,100],"data-driven":[5],"technique":[6],"for":[7],"optimal":[9],"control":[10,47,80],"policies":[11],"in":[12,54,151],"complex":[13],"systems.":[14],"Classical":[15],"RL":[16,91],"methods":[17],"rely":[18],"completely":[19],"on":[20,119,136],"data":[21,56,60,125,154],"with":[22,76],"no":[23],"information":[24,78],"about":[25],"physics":[26],"of":[27,36,40,71,84,123,126],"underlying":[28],"system,":[29],"due":[30],"to":[31,79],"which":[32],"they":[33],"are":[34],"oblivious":[35],"the":[37,41,45,69,81,93,112,115,127,145],"physical":[38,77,146],"constraints":[39],"system":[42,83],"while":[43],"deciding":[44],"next":[46],"action.":[48],"This":[49],"effect":[50],"especially":[52],"pronounced":[53],"low":[55,152],"regimes":[57],"(when":[58],"training":[59,153],"limited).":[62],"In":[63],"this":[64],"research":[65],"work,":[66],"we":[67],"discuss":[68],"potential":[70],"model-based":[72,103],"reinforcement":[73,104],"coupled":[75],"thermal":[82,132],"single-zone":[86],"building.":[87],"We":[88],"compare":[89],"two":[90,137],"methods:":[92],"classical":[94],"vanilla":[95],"deep":[96],"Q-networks":[97],"(v-DQN)":[98],"and":[99,129],"novel":[101],"physics-informed":[102],"(PI-MBRL)":[106],"algorithm.":[107],"The":[108],"results":[109,141],"show":[110],"that":[111],"PI-MBRL":[113],"outperforms":[114],"v-DQN":[116],"when":[117,134],"trained":[118],"just":[120],"4":[121],"weeks":[122],"heating":[124],"building":[128],"provides":[130],"greater":[131],"comfort":[133],"tested":[135],"entire":[138],"months.":[139],"These":[140],"indicate":[142],"how":[143],"injecting":[144],"knowledge":[147],"can":[148],"improve":[149],"performance":[150],"regimes.":[155]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
