{"id":"https://openalex.org/W4414603224","doi":"https://doi.org/10.1109/tsg.2025.3615148","title":"Real-Time Operational Strategy for Ice Thermal Storage District Cooling Systems via Model-Free Safe Deep Reinforcement Learning","display_name":"Real-Time Operational Strategy for Ice Thermal Storage District Cooling Systems via Model-Free Safe Deep Reinforcement Learning","publication_year":2025,"publication_date":"2025-09-29","ids":{"openalex":"https://openalex.org/W4414603224","doi":"https://doi.org/10.1109/tsg.2025.3615148"},"language":"en","primary_location":{"id":"doi:10.1109/tsg.2025.3615148","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsg.2025.3615148","pdf_url":null,"source":{"id":"https://openalex.org/S59604973","display_name":"IEEE Transactions on Smart Grid","issn_l":"1949-3053","issn":["1949-3053","1949-3061"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Smart Grid","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113052020","display_name":"Z.Y. Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Z. Y. Wang","raw_affiliation_strings":["School of Electric Power Engineering, South China University of Technology, Guangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electric Power Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089279497","display_name":"Jiehui Zheng","orcid":"https://orcid.org/0000-0003-4928-6524"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"J. H. Zheng","raw_affiliation_strings":["School of Electric Power Engineering, South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-4928-6524","affiliations":[{"raw_affiliation_string":"School of Electric Power Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016939864","display_name":"Qinghua Wu","orcid":"https://orcid.org/0000-0002-0598-8367"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Q. H. Wu","raw_affiliation_strings":["School of Electric Power Engineering, South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-0598-8367","affiliations":[{"raw_affiliation_string":"School of Electric Power Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113052020"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":0.6342,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.70556303,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"17","issue":"1","first_page":"217","last_page":"229"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11774","display_name":"Adsorption and Cooling Systems","score":0.9502000212669373,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11774","display_name":"Adsorption and Cooling Systems","score":0.9502000212669373,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6730999946594238},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5605999827384949},{"id":"https://openalex.org/keywords/lagrangian-relaxation","display_name":"Lagrangian relaxation","score":0.538100004196167},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5134000182151794},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4074000120162964},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.3799999952316284},{"id":"https://openalex.org/keywords/chiller","display_name":"Chiller","score":0.3659999966621399},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.3553999960422516},{"id":"https://openalex.org/keywords/tardiness","display_name":"Tardiness","score":0.35010001063346863}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6730999946594238},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5728999972343445},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5605999827384949},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5540000200271606},{"id":"https://openalex.org/C91765299","wikidata":"https://www.wikidata.org/wiki/Q3424292","display_name":"Lagrangian relaxation","level":2,"score":0.538100004196167},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5134000182151794},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4074000120162964},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3799999952316284},{"id":"https://openalex.org/C4638862","wikidata":"https://www.wikidata.org/wiki/Q1501558","display_name":"Chiller","level":2,"score":0.3659999966621399},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.3553999960422516},{"id":"https://openalex.org/C2778047078","wikidata":"https://www.wikidata.org/wiki/Q82299449","display_name":"Tardiness","level":4,"score":0.35010001063346863},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.3474999964237213},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.34299999475479126},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.3427000045776367},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.33090001344680786},{"id":"https://openalex.org/C183287310","wikidata":"https://www.wikidata.org/wiki/Q2142963","display_name":"Thermal energy storage","level":2,"score":0.32919999957084656},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.32350000739097595},{"id":"https://openalex.org/C115527620","wikidata":"https://www.wikidata.org/wiki/Q769909","display_name":"Nonlinear programming","level":3,"score":0.3172000050544739},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C131097465","wikidata":"https://www.wikidata.org/wiki/Q178898","display_name":"Gas compressor","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C193254401","wikidata":"https://www.wikidata.org/wiki/Q2160088","display_name":"Robust optimization","level":2,"score":0.29829999804496765},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.29170000553131104},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.28290000557899475},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.28130000829696655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2784000039100647},{"id":"https://openalex.org/C73684929","wikidata":"https://www.wikidata.org/wiki/Q598870","display_name":"Lagrange multiplier","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C123516432","wikidata":"https://www.wikidata.org/wiki/Q572309","display_name":"Chilled water","level":3,"score":0.2727000117301941},{"id":"https://openalex.org/C41045048","wikidata":"https://www.wikidata.org/wiki/Q202843","display_name":"Linear programming","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.2644999921321869},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsg.2025.3615148","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsg.2025.3615148","pdf_url":null,"source":{"id":"https://openalex.org/S59604973","display_name":"IEEE Transactions on Smart Grid","issn_l":"1949-3053","issn":["1949-3053","1949-3061"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Smart Grid","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4575862285","display_name":null,"funder_award_id":"2024A1515240034","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G8910474879","display_name":null,"funder_award_id":"52477097","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1614818300","https://openalex.org/W2073314543","https://openalex.org/W2585893816","https://openalex.org/W2592721868","https://openalex.org/W2614661877","https://openalex.org/W2753070270","https://openalex.org/W2767192707","https://openalex.org/W2902533895","https://openalex.org/W2923786034","https://openalex.org/W3118987800","https://openalex.org/W4210294974","https://openalex.org/W4281763617","https://openalex.org/W4285120868","https://openalex.org/W4320340663","https://openalex.org/W4365129769","https://openalex.org/W4377136712","https://openalex.org/W4380930412","https://openalex.org/W4384466576","https://openalex.org/W4385741161","https://openalex.org/W4390938819","https://openalex.org/W4392889863","https://openalex.org/W4398224797","https://openalex.org/W4400770903","https://openalex.org/W4405304024","https://openalex.org/W4412375006"],"related_works":[],"abstract_inverted_index":{"District":[0],"cooling":[1,6],"system":[2],"(DCS)":[3],"offers":[4],"centralized":[5],"services":[7],"for":[8,56],"building":[9],"groups":[10],"that":[11,187],"significantly":[12],"reduce":[13],"energy":[14],"consumption":[15],"and":[16,28,67,101,125,138,158,177,183,194,203],"carbon":[17],"emissions.":[18],"However,":[19],"existing":[20],"model-based":[21,193],"methods":[22],"struggle":[23],"with":[24],"the":[25,32,57,90,93,97,119,126,142,147,155,163,188],"large-scale,":[26],"stochastic,":[27],"nonlinear":[29],"characteristics":[30],"of":[31,64,162],"DCS":[33,58],"optimization":[34],"problem":[35,77],"under":[36,72],"strict":[37],"time":[38],"limits.":[39],"To":[40],"fill":[41],"this":[42,45],"research":[43],"gap,":[44],"paper":[46],"proposes":[47],"a":[48,81,173],"model-free":[49],"safe":[50],"deep":[51,165],"reinforcement":[52],"learning":[53,132],"(MFS-DRL)":[54],"algorithm":[55],"to":[59,87,134,153],"deliver":[60],"real-time":[61],"scheduling":[62],"strategies":[63],"multiple":[65],"chillers":[66],"ice":[68],"thermal":[69],"storage":[70],"units":[71],"varying":[73],"operating":[74],"conditions.":[75],"The":[76],"is":[78,116,128,151],"modeled":[79],"as":[80],"constrained":[82],"Markov":[83],"decision":[84],"process":[85],"(CMDP)":[86],"systematically":[88],"decouple":[89],"objective":[91],"from":[92],"constraint,":[94],"therefore":[95],"overcoming":[96],"confusion":[98],"between":[99,175],"reward":[100],"penalty":[102,106],"caused":[103],"by":[104],"manual":[105],"coefficients":[107],"in":[108,141],"traditional":[109],"DRL":[110],"methods.":[111],"Moreover,":[112],"prior":[113],"expert":[114],"knowledge":[115],"acquired":[117],"through":[118],"interior":[120],"point":[121],"optimizer":[122],"(IPOPT)":[123],"solver,":[124],"agent":[127],"pre-trained":[129],"using":[130],"imitation":[131],"(IL)":[133],"mitigate":[135],"exploration":[136],"disorder":[137],"local":[139],"convergence":[140],"early":[143],"training":[144],"stage.":[145],"Ultimately,":[146],"Lagrangian":[148],"relaxation":[149],"approach":[150],"applied":[152],"modify":[154],"optimality":[156],"criteria":[157],"gradient":[159,168],"update":[160],"rules":[161],"classic":[164],"deterministic":[166],"policy":[167],"(DDPG)":[169],"algorithm,":[170],"thereby":[171],"achieving":[172],"trade-off":[174],"feasibility":[176],"optimality.":[178],"Numerical":[179],"experiments":[180],"on":[181],"12-node":[182],"619-node":[184],"DCSs":[185],"demonstrate":[186],"proposed":[189],"method":[190],"outperforms":[191],"representative":[192],"data-driven":[195],"baselines,":[196],"delivering":[197],"high-quality":[198],"solutions":[199],"within":[200],"only":[201],"milliseconds":[202],"maintaining":[204],"robustness":[205],"across":[206],"hyperparameter":[207],"variations.":[208]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
