{"id":"https://openalex.org/W4308216324","doi":"https://doi.org/10.1109/allerton49937.2022.9929321","title":"Reinforcement Learning using Physics Inspired Graph Convolutional Neural Networks","display_name":"Reinforcement Learning using Physics Inspired Graph Convolutional Neural Networks","publication_year":2022,"publication_date":"2022-09-27","ids":{"openalex":"https://openalex.org/W4308216324","doi":"https://doi.org/10.1109/allerton49937.2022.9929321"},"language":"en","primary_location":{"id":"doi:10.1109/allerton49937.2022.9929321","is_oa":false,"landing_page_url":"https://doi.org/10.1109/allerton49937.2022.9929321","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 58th Annual Allerton Conference on Communication, Control, and Computing (Allerton)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000348675","display_name":"Tong Wu","orcid":"https://orcid.org/0000-0002-7474-6943"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tong Wu","raw_affiliation_strings":["Cornell Tech, Cornell University,Department of Electrical and Computer Engineering,New York City,NY,USA,10044"],"affiliations":[{"raw_affiliation_string":"Cornell Tech, Cornell University,Department of Electrical and Computer Engineering,New York City,NY,USA,10044","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029881017","display_name":"Anna Scaglione","orcid":"https://orcid.org/0000-0002-8892-3680"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anna Scaglione","raw_affiliation_strings":["Cornell Tech, Cornell University,Department of Electrical and Computer Engineering,New York City,NY,USA,10044"],"affiliations":[{"raw_affiliation_string":"Cornell Tech, Cornell University,Department of Electrical and Computer Engineering,New York City,NY,USA,10044","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078056875","display_name":"Daniel Arnold","orcid":"https://orcid.org/0000-0001-8897-1132"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daniel Arnold","raw_affiliation_strings":["Lawrence Berkeley National Laboratory"],"affiliations":[{"raw_affiliation_string":"Lawrence Berkeley National Laboratory","institution_ids":["https://openalex.org/I148283060"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5000348675"],"corresponding_institution_ids":["https://openalex.org/I205783295"],"apc_list":null,"apc_paid":null,"fwci":1.1936,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.82466813,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8405099511146545},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.638954758644104},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5037469267845154},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.498720645904541},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4844372570514679},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2896389067173004}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8405099511146545},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.638954758644104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5037469267845154},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.498720645904541},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4844372570514679},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2896389067173004}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/allerton49937.2022.9929321","is_oa":false,"landing_page_url":"https://doi.org/10.1109/allerton49937.2022.9929321","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 58th Annual Allerton Conference on Communication, Control, and Computing (Allerton)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8899999856948853,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G6778738363","display_name":null,"funder_award_id":"2210012","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2153573511","https://openalex.org/W2736601468","https://openalex.org/W2781726626","https://openalex.org/W2883076328","https://openalex.org/W2902098903","https://openalex.org/W2964321699","https://openalex.org/W2972852318","https://openalex.org/W2991859550","https://openalex.org/W3020785977","https://openalex.org/W3035404531","https://openalex.org/W3043475934","https://openalex.org/W3100789280","https://openalex.org/W3110616637","https://openalex.org/W3117471124","https://openalex.org/W3122780823","https://openalex.org/W3126981000","https://openalex.org/W3132337045","https://openalex.org/W3135258945","https://openalex.org/W3177082290","https://openalex.org/W3185133591","https://openalex.org/W3190160068","https://openalex.org/W3201161517","https://openalex.org/W3203414399","https://openalex.org/W6720006811","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6790242746","https://openalex.org/W6796312900","https://openalex.org/W6799658050","https://openalex.org/W6801340522","https://openalex.org/W6802466547"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109","https://openalex.org/W4362501864","https://openalex.org/W2001405890"],"abstract_inverted_index":{"In":[0,107],"this":[1],"work,":[2],"we":[3,42,58,119],"propose":[4],"a":[5,116],"physics":[6],"inspired":[7],"Graph":[8],"Convolutional":[9],"Neural":[10],"Network":[11],"(GCN)-Reinforcement":[12],"Learning":[13],"(RL)":[14],"architecture":[15],"to":[16,83,109,130],"train":[17],"online":[18],"controllers":[19],"policies":[20,142],"for":[21,64,77,115],"the":[22,32,48,60,74,87,111,121,138,148],"optimal":[23],"selection":[24,61],"of":[25,34,62,70,113,123,140],"Distributed":[26],"Energy":[27],"Resources":[28],"(DER)":[29],"set-points.":[30],"While":[31],"use":[33],"GCN":[35,88,114],"is":[36,90],"compatible":[37],"with":[38,47],"any":[39],"DRL":[40],"scheme,":[41],"test":[43,137],"it":[44],"in":[45,96],"combination":[46],"popular":[49],"proximal":[50],"policy":[51],"optimization":[52],"(PPO)":[53],"algorithm":[54],"and,":[55],"as":[56,73],"application,":[57],"consider":[59],"set-points":[63],"Volt/Var":[65],"and":[66,99,146],"Volt/Watt":[67],"control":[68],"logic":[69],"smart":[71],"inverters":[72],"case":[75,122],"study":[76],"DER":[78],"control.":[79],"We":[80,136],"are":[81,126],"able":[82],"show":[84],"numerically":[85],"that":[86,125],"scheme":[89,149],"more":[91],"effective":[92],"than":[93],"various":[94],"benchmarks":[95],"regulating":[97],"voltage":[98,102],"miti-gating":[100],"undesirable":[101],"dynamics":[103],"generated":[104],"by":[105],"cyber-attacks.":[106],"addition":[108],"exploring":[110],"performance":[112],"given":[117],"network,":[118],"investigate":[120],"grids":[124],"dynamically":[127],"changing":[128],"due":[129],"topology":[131],"or":[132],"line":[133],"parameters":[134],"variations.":[135],"robustness":[139],"GCN-RL":[141],"against":[143],"small":[144],"perturbations":[145],"evaluate":[147],"so":[150],"called":[151],"\u201ctransfer":[152],"learning\u201d":[153],"capabilities.":[154]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
