{"id":"https://openalex.org/W4408780478","doi":"https://doi.org/10.1109/tase.2025.3554431","title":"Explainable and Safety Aware Deep Reinforcement Learning-Based Control of Nonlinear Discrete-Time Systems Using Neural Network Gradient Decomposition","display_name":"Explainable and Safety Aware Deep Reinforcement Learning-Based Control of Nonlinear Discrete-Time Systems Using Neural Network Gradient Decomposition","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4408780478","doi":"https://doi.org/10.1109/tase.2025.3554431"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2025.3554431","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3554431","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020402404","display_name":"Behzad Farzanegan","orcid":"https://orcid.org/0000-0002-8660-2111"},"institutions":[{"id":"https://openalex.org/I20382870","display_name":"Missouri University of Science and Technology","ror":"https://ror.org/00scwqd12","country_code":"US","type":"education","lineage":["https://openalex.org/I20382870"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Behzad Farzanegan","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, MO, USA","Dept. of Elec. and Comp. Engg, Missouri University of Science and Technology, Rolla, MO, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, MO, USA","institution_ids":["https://openalex.org/I20382870"]},{"raw_affiliation_string":"Dept. of Elec. and Comp. Engg, Missouri University of Science and Technology, Rolla, MO, USA","institution_ids":["https://openalex.org/I20382870"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078910343","display_name":"S. Jagannathan","orcid":"https://orcid.org/0000-0002-2310-3737"},"institutions":[{"id":"https://openalex.org/I20382870","display_name":"Missouri University of Science and Technology","ror":"https://ror.org/00scwqd12","country_code":"US","type":"education","lineage":["https://openalex.org/I20382870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sarangapani Jagannathan","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, MO, USA","Dept. of Elec. and Comp. Engg, Missouri University of Science and Technology, Rolla, MO, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, MO, USA","institution_ids":["https://openalex.org/I20382870"]},{"raw_affiliation_string":"Dept. of Elec. and Comp. Engg, Missouri University of Science and Technology, Rolla, MO, USA","institution_ids":["https://openalex.org/I20382870"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5020402404"],"corresponding_institution_ids":["https://openalex.org/I20382870"],"apc_list":null,"apc_paid":null,"fwci":7.0705,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96176375,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"22","issue":null,"first_page":"13556","last_page":"13568"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.8075000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.8075000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.7124999761581421,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14470","display_name":"Advanced Data Processing Techniques","score":0.6593000292778015,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7352035641670227},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.7290931344032288},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.6520330905914307},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.5821089744567871},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5718240141868591},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.518814742565155},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4727393388748169},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.43800050020217896},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.4342377781867981},{"id":"https://openalex.org/keywords/discrete-time-and-continuous-time","display_name":"Discrete time and continuous time","score":0.4186953008174896},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3786960244178772},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.28871047496795654},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17527684569358826}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7352035641670227},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.7290931344032288},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.6520330905914307},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.5821089744567871},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5718240141868591},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.518814742565155},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4727393388748169},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.43800050020217896},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.4342377781867981},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.4186953008174896},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3786960244178772},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.28871047496795654},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17527684569358826},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2025.3554431","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3554431","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3364754307","display_name":null,"funder_award_id":"N00014-23-2195","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G5526555046","display_name":null,"funder_award_id":"N00014-23-1-2195","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G7203712336","display_name":null,"funder_award_id":"N00014-21-1-2232","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G8090444566","display_name":null,"funder_award_id":"N00014-24-1-2338","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G8899011038","display_name":null,"funder_award_id":"N00014-24-2338","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1489327260","https://openalex.org/W1980569135","https://openalex.org/W2150841368","https://openalex.org/W2325204300","https://openalex.org/W2345348539","https://openalex.org/W2516809705","https://openalex.org/W2560504659","https://openalex.org/W2735010720","https://openalex.org/W2975408797","https://openalex.org/W3011888914","https://openalex.org/W3045680111","https://openalex.org/W3119933750","https://openalex.org/W3120954879","https://openalex.org/W3127275112","https://openalex.org/W3135195117","https://openalex.org/W3202362797","https://openalex.org/W3206048862","https://openalex.org/W3209924761","https://openalex.org/W4200325667","https://openalex.org/W4312757239","https://openalex.org/W4313146255","https://openalex.org/W4385863710","https://openalex.org/W4386031067","https://openalex.org/W4386108459","https://openalex.org/W4390748515","https://openalex.org/W4390749062","https://openalex.org/W4391128324","https://openalex.org/W4391301040","https://openalex.org/W4395082122","https://openalex.org/W4396911939","https://openalex.org/W4397024165","https://openalex.org/W4399563101","https://openalex.org/W4403826514","https://openalex.org/W4405381559","https://openalex.org/W6737947904","https://openalex.org/W6748380982","https://openalex.org/W6769692591","https://openalex.org/W6772100842","https://openalex.org/W6881361898"],"related_works":["https://openalex.org/W2088845016","https://openalex.org/W589102260","https://openalex.org/W1966421350","https://openalex.org/W1868434454","https://openalex.org/W4366985237","https://openalex.org/W2810569973","https://openalex.org/W2128396103","https://openalex.org/W4366984740","https://openalex.org/W4367299891","https://openalex.org/W4367365565"],"abstract_inverted_index":{"This":[0,228],"paper":[1,229],"presents":[2],"an":[3,148,286,289],"explainable":[4],"deep-reinforcement":[5],"learning":[6,117,294],"(DRL)-based":[7],"safety-aware":[8,73,81,107],"optimal":[9,44,82,166,201],"adaptive":[10],"tracking":[11],"(SOAT)":[12],"scheme":[13,155,253],"for":[14,151,280,292,314],"a":[15,32,189,234,273],"class":[16],"of":[17,60,176,233,319],"nonlinear":[18,256],"discrete-time":[19,257],"(DT)":[20],"affine":[21],"systems":[22,258],"subject":[23],"to":[24,38,66,146,158,196,205,221,226,337],"state":[25,122,262],"inequality":[26,263],"constraints.":[27,264],"The":[28,105,168,265,317],"DRL-based":[29,153,236,251,283],"SOAT":[30,154,252,284],"utilizes":[31],"multilayer":[33],"neural":[34],"network":[35],"(MNN)-based":[36],"actor-critic":[37,126,199,290],"estimate":[39],"the":[40,47,55,68,92,99,102,133,140,152,160,165,174,177,197,231,278,302],"cost":[41,194],"function":[42,62,96],"and":[43,72,119,135,295,346,352],"policy":[45,83,296],"while":[46],"MNN":[48,127,200,287],"update":[49,128],"laws":[50],"are":[51,354],"tuned":[52],"both":[53,114],"using":[54,86],"singular":[56],"value":[57],"decomposition":[58],"(SVD)":[59],"activation":[61],"gradient":[63,70],"in":[64,156,163,192,270],"order":[65,157],"mitigate":[67],"vanishing":[69],"issue":[71],"Bellman":[74,108],"error":[75,109],"at":[76,120],"each":[77],"layer.":[78],"An":[79],"approximate":[80],"is":[84,171,180,213,312],"developed":[85],"Karush-Kuhn\u2013Tucker":[87],"(KKT)":[88],"conditions":[89],"by":[90,323],"incorporating":[91],"higher-order":[93],"control":[94,202,208,237,268,329],"barrier":[95],"(HOCBF)":[97],"into":[98,301],"Hamiltonian":[100],"through":[101],"Lagrangian":[103],"multiplier.":[104],"resulting":[106],"helps":[110],"with":[111,288],"safe":[112,235,305],"exploration":[113],"during":[115,308],"online":[116,309],"phase":[118],"steady":[121],"without":[123],"any":[124],"explicit":[125],"law":[129],"changes.":[130],"To":[131],"study":[132],"explainability":[134,353],"gain":[136],"insights,":[137],"we":[138],"employ":[139],"Shapley":[141],"Additive":[142],"Explanations":[143],"(SHAP)":[144],"method":[145,179],"construct":[147],"explainer":[149],"model":[150],"identify":[159],"important":[161],"features":[162,326],"determining":[164],"policy.":[167,203],"overall":[169],"stability":[170],"established.":[172],"Finally,":[173],"effectiveness":[175],"proposed":[178,267],"demonstrated":[181],"on":[182,272],"Shipboard":[183,274],"Power":[184,275],"Systems":[185],"(SPS),":[186],"achieving":[187],"over":[188],"35%":[190],"reduction":[191],"cumulative":[193],"compared":[195],"existing":[198],"Note":[204],"Practitioners\u2014In":[206],"practical":[207,281],"systems,":[209],"meeting":[210],"safety":[211,248],"constraints":[212,218],"often":[214],"critical":[215,313],"since":[216],"ignoring":[217],"can":[219],"lead":[220],"degraded":[222],"performance":[223,243,269],"or":[224],"damage":[225],"equipment.":[227],"addresses":[230],"challenge":[232],"approach":[238],"that":[239,259,327],"not":[240],"only":[241],"optimizes":[242],"but":[244],"also":[245],"integrates":[246],"robust":[247],"assurances.":[249],"Our":[250],"specifically":[254],"targets":[255],"must":[260],"satisfy":[261],"successful":[266],"simulations":[271],"System":[276],"demonstrates":[277],"potential":[279],"applications.":[282,316],"employs":[285],"framework":[291,336],"continuous":[293],"adaptation.":[297],"Integrating":[298],"HOCBFs":[299],"directly":[300],"optimization":[303],"ensures":[304],"operation,":[306],"even":[307],"learning,":[310],"which":[311],"real-time":[315],"addition":[318],"SHAP":[320],"enhances":[321],"transparency":[322],"identifying":[324],"key":[325],"influence":[328],"decisions.":[330],"Future":[331],"work":[332],"could":[333],"adapt":[334],"this":[335],"other":[338],"constrained":[339],"environments,":[340],"such":[341],"as":[342],"autonomous":[343],"vehicles,":[344],"robotics,":[345],"industrial":[347],"automation,":[348],"where":[349],"safety,":[350],"optimality,":[351],"essential.":[355]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
