{"id":"https://openalex.org/W3006344226","doi":"https://doi.org/10.1109/tnnls.2020.2967871","title":"Safe Intermittent Reinforcement Learning With Static and Dynamic Event Generators","display_name":"Safe Intermittent Reinforcement Learning With Static and Dynamic Event Generators","publication_year":2020,"publication_date":"2020-02-11","ids":{"openalex":"https://openalex.org/W3006344226","doi":"https://doi.org/10.1109/tnnls.2020.2967871","mag":"3006344226","pmid":"https://pubmed.ncbi.nlm.nih.gov/32054590"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2020.2967871","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2020.2967871","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053342436","display_name":"Yongliang Yang","orcid":"https://orcid.org/0000-0002-3144-8604"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yongliang Yang","raw_affiliation_strings":["Key Laboratory of Knowledge Automation for Industrial Processes, Ministry of Education, University of Science and Technology Beijing, Beijing, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3144-8604","affiliations":[{"raw_affiliation_string":"Key Laboratory of Knowledge Automation for Industrial Processes, Ministry of Education, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040301558","display_name":"Kyriakos G. Vamvoudakis","orcid":"https://orcid.org/0000-0003-1978-4848"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kyriakos G. Vamvoudakis","raw_affiliation_strings":["Daniel Guggenheim School of Aerospace Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"raw_orcid":"https://orcid.org/0000-0003-1978-4848","affiliations":[{"raw_affiliation_string":"Daniel Guggenheim School of Aerospace Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063118155","display_name":"Hamidreza Modares","orcid":"https://orcid.org/0000-0003-0800-5140"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hamidreza Modares","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"raw_orcid":"https://orcid.org/0000-0003-0800-5140","affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101512101","display_name":"Yixin Yin","orcid":"https://orcid.org/0000-0001-6056-8878"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixin Yin","raw_affiliation_strings":["Key Laboratory of Knowledge Automation for Industrial Processes, Ministry of Education, University of Science and Technology Beijing, Beijing, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6056-8878","affiliations":[{"raw_affiliation_string":"Key Laboratory of Knowledge Automation for Industrial Processes, Ministry of Education, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038037619","display_name":"Donald C. Wunsch","orcid":"https://orcid.org/0000-0002-9726-9051"},"institutions":[{"id":"https://openalex.org/I20382870","display_name":"Missouri University of Science and Technology","ror":"https://ror.org/00scwqd12","country_code":"US","type":"education","lineage":["https://openalex.org/I20382870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Donald C. Wunsch","raw_affiliation_strings":["Missouri University of Science and Technology, Rolla, MO, USA"],"raw_orcid":"https://orcid.org/0000-0002-9726-9051","affiliations":[{"raw_affiliation_string":"Missouri University of Science and Technology, Rolla, MO, USA","institution_ids":["https://openalex.org/I20382870"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5053342436"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":9.4738,"has_fulltext":false,"cited_by_count":101,"citation_normalized_percentile":{"value":0.98380054,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"31","issue":"12","first_page":"5441","last_page":"5455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14083","display_name":"Extremum Seeking Control Systems","score":0.9603000283241272,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9016804099082947},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.845606803894043},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7017268538475037},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5126916170120239},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.4490271508693695},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.44802412390708923},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.4373874366283417},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3128887116909027},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.21980178356170654},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13742870092391968}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9016804099082947},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.845606803894043},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7017268538475037},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5126916170120239},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.4490271508693695},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.44802412390708923},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.4373874366283417},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3128887116909027},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.21980178356170654},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13742870092391968},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2020.2967871","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2020.2967871","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:32054590","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32054590","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.4399999976158142,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G1566696561","display_name":null,"funder_award_id":"61903028","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2423437851","display_name":null,"funder_award_id":"FRF-BD-17-002A","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G3094653860","display_name":null,"funder_award_id":"W911NF-18-2-0260","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G5205608926","display_name":null,"funder_award_id":"FRF-TP-18-031A1","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G5523829882","display_name":null,"funder_award_id":"2018M641197","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"},{"id":"https://openalex.org/G7973029781","display_name":null,"funder_award_id":"S&AS-1849264","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8491087190","display_name":null,"funder_award_id":"CPS-1851588","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W1515851193","https://openalex.org/W1559261542","https://openalex.org/W1606119439","https://openalex.org/W1968908471","https://openalex.org/W1976822687","https://openalex.org/W1978518835","https://openalex.org/W1982107603","https://openalex.org/W1983523797","https://openalex.org/W1988688219","https://openalex.org/W2010152647","https://openalex.org/W2019166202","https://openalex.org/W2032736119","https://openalex.org/W2049933349","https://openalex.org/W2062373349","https://openalex.org/W2097121541","https://openalex.org/W2108286682","https://openalex.org/W2121570671","https://openalex.org/W2146487916","https://openalex.org/W2152161277","https://openalex.org/W2314983263","https://openalex.org/W2319074362","https://openalex.org/W2480536132","https://openalex.org/W2509783950","https://openalex.org/W2513580371","https://openalex.org/W2518470966","https://openalex.org/W2538000344","https://openalex.org/W2560370148","https://openalex.org/W2585299106","https://openalex.org/W2727279496","https://openalex.org/W2765910425","https://openalex.org/W2772102164","https://openalex.org/W2772589676","https://openalex.org/W2788444134","https://openalex.org/W2789789879","https://openalex.org/W2792583192","https://openalex.org/W2793914020","https://openalex.org/W2793996673","https://openalex.org/W2796359973","https://openalex.org/W2803973384","https://openalex.org/W2918660012","https://openalex.org/W2919774326","https://openalex.org/W2921163467","https://openalex.org/W2943066999","https://openalex.org/W2955358943","https://openalex.org/W2970427121","https://openalex.org/W2973021624"],"related_works":["https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W4380318855","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2768698792","https://openalex.org/W2386410636","https://openalex.org/W2025663273","https://openalex.org/W3038962357","https://openalex.org/W3099153698"],"abstract_inverted_index":{"In":[0],"this":[1],"article,":[2],"we":[3,15],"present":[4],"an":[5,32,61],"intermittent":[6,45],"framework":[7],"for":[8],"safe":[9],"reinforcement":[10],"learning":[11],"(RL)":[12],"algorithms.":[13],"First,":[14],"develop":[16],"a":[17,52,55],"barrier":[18],"function-based":[19],"system":[20],"transformation":[21],"to":[22,31,64],"impose":[23],"state":[24],"constraints":[25],"while":[26,69],"converting":[27],"the":[28,66,78,81],"original":[29],"problem":[30,67],"unconstrained":[33],"optimization":[34],"problem.":[35],"Second,":[36],"based":[37],"on":[38],"optimal":[39],"derived":[40],"policies,":[41],"two":[42],"types":[43],"of":[44,80],"feedback":[46],"RL":[47],"algorithms":[48],"are":[49],"presented,":[50],"namely,":[51],"static":[53],"and":[54,73],"dynamic":[56],"one.":[57],"We":[58],"finally":[59],"leverage":[60],"actor/critic":[62],"structure":[63],"solve":[65],"online":[68],"guaranteeing":[70],"optimality,":[71],"stability,":[72],"safety.":[74],"Simulation":[75],"results":[76],"show":[77],"efficacy":[79],"proposed":[82],"approach.":[83]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":20},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":16},{"year":2022,"cited_by_count":20},{"year":2021,"cited_by_count":18},{"year":2020,"cited_by_count":11}],"updated_date":"2026-05-24T08:33:08.758527","created_date":"2025-10-10T00:00:00"}
