{"id":"https://openalex.org/W4410770393","doi":"https://doi.org/10.1109/tsg.2025.3568226","title":"RL2: Reinforce Large Language Model to Assist Safe Reinforcement Learning for Energy Management of Active Distribution Networks","display_name":"RL2: Reinforce Large Language Model to Assist Safe Reinforcement Learning for Energy Management of Active Distribution Networks","publication_year":2025,"publication_date":"2025-05-27","ids":{"openalex":"https://openalex.org/W4410770393","doi":"https://doi.org/10.1109/tsg.2025.3568226"},"language":"en","primary_location":{"id":"doi:10.1109/tsg.2025.3568226","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsg.2025.3568226","pdf_url":null,"source":{"id":"https://openalex.org/S59604973","display_name":"IEEE Transactions on Smart Grid","issn_l":"1949-3053","issn":["1949-3053","1949-3061"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Smart Grid","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100022174","display_name":"Xu Yang","orcid":"https://orcid.org/0000-0002-5883-7677"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xu Yang","raw_affiliation_strings":["Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5883-7677","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030737811","display_name":"Chenhui Lin","orcid":"https://orcid.org/0000-0001-7455-8793"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenhui Lin","raw_affiliation_strings":["Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7455-8793","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100448792","display_name":"Haotian Liu","orcid":"https://orcid.org/0000-0001-7939-9242"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haotian Liu","raw_affiliation_strings":["Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7939-9242","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009457440","display_name":"Wenchuan Wu","orcid":"https://orcid.org/0000-0002-8154-2412"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenchuan Wu","raw_affiliation_strings":["Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-8154-2412","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, State Key Laboratory of Power Systems, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100022174"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":15.6051,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.99210982,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"16","issue":"4","first_page":"3419","last_page":"3431"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7075681090354919},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5803850293159485},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.46676748991012573},{"id":"https://openalex.org/keywords/energy-management","display_name":"Energy management","score":0.42298591136932373},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.4137609601020813},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3215496838092804},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.26284050941467285},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.1171879768371582},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11237528920173645}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7075681090354919},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5803850293159485},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.46676748991012573},{"id":"https://openalex.org/C7817414","wikidata":"https://www.wikidata.org/wiki/Q1779504","display_name":"Energy management","level":3,"score":0.42298591136932373},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.4137609601020813},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3215496838092804},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.26284050941467285},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.1171879768371582},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11237528920173645},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsg.2025.3568226","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsg.2025.3568226","pdf_url":null,"source":{"id":"https://openalex.org/S59604973","display_name":"IEEE Transactions on Smart Grid","issn_l":"1949-3053","issn":["1949-3053","1949-3061"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Smart Grid","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8399999737739563,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G1157879939","display_name":null,"funder_award_id":"52321004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7649562423","display_name":null,"funder_award_id":"52307101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W2064031160","https://openalex.org/W2088511592","https://openalex.org/W2088543143","https://openalex.org/W2164304826","https://openalex.org/W2885669798","https://openalex.org/W2904246096","https://openalex.org/W2997572754","https://openalex.org/W3043986811","https://openalex.org/W3131436982","https://openalex.org/W3189279150","https://openalex.org/W3199571765","https://openalex.org/W4206269615","https://openalex.org/W4210476130","https://openalex.org/W4214717370","https://openalex.org/W4241079583","https://openalex.org/W4313145927","https://openalex.org/W4319338775","https://openalex.org/W4320015775","https://openalex.org/W4360995403","https://openalex.org/W4382119111","https://openalex.org/W4383340036","https://openalex.org/W4386766887","https://openalex.org/W4387886075","https://openalex.org/W4388579591","https://openalex.org/W4392867353","https://openalex.org/W4400351464","https://openalex.org/W4402877676","https://openalex.org/W6687063787","https://openalex.org/W6737893269","https://openalex.org/W6780559895","https://openalex.org/W6803595505","https://openalex.org/W6809646742","https://openalex.org/W6857151620","https://openalex.org/W6859702968","https://openalex.org/W6869822814"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2354768891","https://openalex.org/W4229332389","https://openalex.org/W1510108650","https://openalex.org/W2322968447","https://openalex.org/W2356819012"],"abstract_inverted_index":{"As":[0],"large-scale":[1],"distributed":[2],"energy":[3,14,47,136],"resources":[4],"are":[5],"integrated":[6],"into":[7],"the":[8,34,44,63,86,100,105,145,168,179,183,195,204,207,214,217],"active":[9],"distribution":[10,24],"networks":[11],"(ADNs),":[12],"effective":[13],"management":[15,48,137],"in":[16,49,59,80,138,152,177],"ADNs":[17,153],"becomes":[18,52],"increasingly":[19],"prominent":[20],"compared":[21],"to":[22,72,98,131,147,166],"traditional":[23],"networks.":[25],"Although":[26],"advanced":[27],"reinforcement":[28],"learning":[29,121],"(RL)":[30],"methods,":[31],"which":[32,70,178],"alleviate":[33],"burden":[35],"of":[36,46,67,194,206,216],"complicated":[37],"modelling":[38],"and":[39,65,82,95,108,119,154,172,186,191],"optimization,":[40],"have":[41],"greatly":[42],"improved":[43],"efficiency":[45,109],"ADNs,":[50],"safety":[51,74,107,150],"a":[53,92,128],"critical":[54],"concern":[55],"for":[56,91,135],"RL":[57,81,134,197],"applications":[58],"real-world":[60],"problems.":[61],"Since":[62],"design":[64],"adjustment":[66],"penalty":[68,101,157],"functions,":[69],"correspond":[71],"operational":[73,106,149],"constraints,":[75],"require":[76],"extensive":[77],"domain":[78],"knowledge":[79],"power":[83],"system":[84],"operation,":[85],"emerging":[87],"ADN":[88,208],"operators":[89],"call":[90],"more":[93],"flexible":[94],"customized":[96],"approach":[97],"address":[99],"functions":[102,170,184],"so":[103],"that":[104],"can":[110],"be":[111],"further":[112],"enhanced.":[113],"Empowered":[114],"with":[115],"strong":[116],"comprehension,":[117],"reasoning,":[118],"in-context":[120],"capabilities,":[122],"large":[123],"language":[124],"models":[125],"(LLMs)":[126],"provide":[127],"promising":[129],"way":[130],"assist":[132],"safe":[133],"ADNs.":[139],"In":[140,159],"this":[141],"paper,":[142],"we":[143,161],"introduce":[144],"LLM":[146,180],"comprehend":[148],"requirements":[151],"generate":[155],"corresponding":[156],"functions.":[158],"addition,":[160],"propose":[162],"an":[163],"RL2":[164],"mechanism":[165],"refine":[167],"generated":[169],"iteratively":[171],"adaptively":[173],"through":[174],"multi-round":[175],"dialogues,":[176],"agent":[181],"adjusts":[182],"pattern":[185],"parameters":[187],"based":[188],"on":[189],"training":[190],"test":[192,211],"performance":[193],"downstream":[196],"agent.":[198],"The":[199],"proposed":[200,218],"method":[201],"significantly":[202],"reduces":[203],"intervention":[205],"operators.":[209],"Comprehensive":[210],"results":[212],"demonstrate":[213],"effectiveness":[215],"method.":[219]},"counts_by_year":[{"year":2026,"cited_by_count":11},{"year":2025,"cited_by_count":4}],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
