{"id":"https://openalex.org/W4406387724","doi":"https://doi.org/10.1109/tcad.2025.3529820","title":"Error Resilient Online Reinforcement Learning Using Adaptive Statistical Checks","display_name":"Error Resilient Online Reinforcement Learning Using Adaptive Statistical Checks","publication_year":2025,"publication_date":"2025-01-15","ids":{"openalex":"https://openalex.org/W4406387724","doi":"https://doi.org/10.1109/tcad.2025.3529820"},"language":"en","primary_location":{"id":"doi:10.1109/tcad.2025.3529820","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2025.3529820","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028115522","display_name":"Chandramouli Amarnath","orcid":"https://orcid.org/0000-0001-9938-2157"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chandramouli Amarnath","raw_affiliation_strings":["Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","Department of ECE, Georgia Institute of Technology, United States"],"raw_orcid":"https://orcid.org/0000-0001-9938-2157","affiliations":[{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, United States","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008790654","display_name":"Mohamed Mejri","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohamed Mejri","raw_affiliation_strings":["Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","Department of ECE, Georgia Institute of Technology, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, United States","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jackson Isenberg","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jackson Isenberg","raw_affiliation_strings":["Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","Department of ECE, Georgia Institute of Technology, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, United States","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069579193","display_name":"Abhijit Chatterjee","orcid":"https://orcid.org/0000-0003-1553-4470"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abhijit Chatterjee","raw_affiliation_strings":["Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","Department of ECE, Georgia Institute of Technology, United States"],"raw_orcid":"https://orcid.org/0000-0003-1553-4470","affiliations":[{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Department of ECE, Georgia Institute of Technology, United States","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0704,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.75058086,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"44","issue":"8","first_page":"3112","last_page":"3125"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9587000012397766,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9587000012397766,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9549999833106995,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.951200008392334,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.696631908416748},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.637864351272583},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6115983128547668},{"id":"https://openalex.org/keywords/statistical-learning","display_name":"Statistical learning","score":0.4892146587371826},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44650793075561523},{"id":"https://openalex.org/keywords/online-learning","display_name":"Online learning","score":0.4230560064315796},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3946547210216522},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.18799954652786255},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.11830121278762817},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.08762320876121521}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.696631908416748},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.637864351272583},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6115983128547668},{"id":"https://openalex.org/C2982736386","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Statistical learning","level":2,"score":0.4892146587371826},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44650793075561523},{"id":"https://openalex.org/C2986087404","wikidata":"https://www.wikidata.org/wiki/Q15946010","display_name":"Online learning","level":2,"score":0.4230560064315796},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3946547210216522},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.18799954652786255},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.11830121278762817},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.08762320876121521}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcad.2025.3529820","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2025.3529820","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4474951375","display_name":null,"funder_award_id":"2128149","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1973882569","https://openalex.org/W1975194220","https://openalex.org/W1987034518","https://openalex.org/W1989361845","https://openalex.org/W2073826979","https://openalex.org/W2083613288","https://openalex.org/W2119717200","https://openalex.org/W2145339207","https://openalex.org/W2150679822","https://openalex.org/W2152652532","https://openalex.org/W2268994915","https://openalex.org/W2770542984","https://openalex.org/W2798273231","https://openalex.org/W2804268686","https://openalex.org/W2897130165","https://openalex.org/W2901848761","https://openalex.org/W2903175372","https://openalex.org/W2904246096","https://openalex.org/W2971653768","https://openalex.org/W2985374077","https://openalex.org/W3000371584","https://openalex.org/W3013072087","https://openalex.org/W3013700197","https://openalex.org/W3034900101","https://openalex.org/W3036979375","https://openalex.org/W3046764219","https://openalex.org/W3090586977","https://openalex.org/W3096295711","https://openalex.org/W3097787172","https://openalex.org/W3112790703","https://openalex.org/W3117215073","https://openalex.org/W3127561923","https://openalex.org/W3171039560","https://openalex.org/W3185879101","https://openalex.org/W3187862527","https://openalex.org/W3201365832","https://openalex.org/W4308477919","https://openalex.org/W4380881139","https://openalex.org/W4386211404","https://openalex.org/W4386764660","https://openalex.org/W4388878451","https://openalex.org/W6601425427","https://openalex.org/W6770246895","https://openalex.org/W6803914020"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W3199500035","https://openalex.org/W3201059918"],"abstract_inverted_index":{"Online":[0],"deep":[1,138,148,172],"reinforcement":[2,29],"learning":[3,30,59,161,237],"(deep":[4],"RL)-based":[5],"systems":[6,60],"are":[7,94,184,214,226],"being":[8],"increasingly":[9],"deployed":[10],"in":[11,57,170,219],"a":[12,106,261],"variety":[13],"of":[14,22,49,66,118,159,196,249],"safety-critical":[15],"applications.":[16,101],"Due":[17],"to":[18,35,53,70,91,96,129,164,186,202,204,216,232],"the":[19,23,47,64,124,137,147,200,220,247,250],"dynamic":[20],"nature":[21],"environments":[24],"they":[25],"work":[26],"in,":[27],"onboard":[28,99],"(RL)":[31],"hardware":[32,88,262],"is":[33,75,244],"vulnerable":[34],"soft":[36],"errors":[37,169],"from":[38],"radiation,":[39],"thermal":[40],"effects":[41],"and":[42,167,234,252],"electrical":[43],"noise":[44],"that":[45,114],"corrupts":[46],"results":[48],"computations.":[50],"Existing":[51],"approaches":[52,85],"on-line":[54,209],"error":[55,108,131],"resilience":[56,72,109],"machine":[58],"have":[61],"relied":[62],"on":[63,146,156,254],"availability":[65],"large":[67],"training":[68,92,127,240],"datasets":[69],"configure":[71,130],"parameters.":[73],"This":[74],"not":[76],"always":[77],"feasible":[78],"for":[79,98,111,136],"online":[80,112,160,171,236],"RL":[81,100,113,126,139,149,173,210,256],"systems.":[82],"Similarly,":[83,142],"other":[84],"involving":[86],"specialized":[87],"or":[89,190],"modifications":[90],"algorithms":[93,257],"difficult":[95],"implement":[97],"In":[102,175],"contrast,":[103],"we":[104,143],"present":[105],"novel":[107],"approach":[110,243],"leverages":[115],"running":[116,153,182,197],"statistics":[117,183,198],"neuron":[119,188],"output":[120],"values":[121],"collected":[122],"across":[123],"(real-time)":[125],"process":[128],"detection":[132],"thresholds":[133,155],"(called":[134],"checks)":[135],"forward":[140,221],"pass.":[141,222],"formulate":[144],"checks":[145,201],"backward":[150],"pass":[151],"using":[152],"statistical":[154,178],"reduced-dimension":[157],"checksums":[158],"weight":[162,224,230],"updates":[163,225,231],"rapidly":[165],"detect":[166],"correct":[168],"training.":[174,211],"this":[176],"methodology,":[177],"concentration":[179],"bounds":[180],"leveraging":[181],"used":[185],"diagnose":[187],"outputs":[189],"weights":[191],"as":[192,258,260],"erroneous.":[193],"The":[194],"use":[195],"allows":[199],"adapt":[203],"changes":[205],"caused":[206],"by":[207],"continual":[208],"Erroneous":[212,223],"neurons":[213],"set":[215],"zero":[217],"(suppressed)":[218],"frozen,":[227],"allowing":[228,235],"nonerroneous":[229],"proceed":[233],"without":[238],"rerunning":[239],"episodes.":[241],"Our":[242],"compared":[245],"against":[246],"state":[248],"art":[251],"validated":[253],"several":[255],"well":[259],"validation":[263],"platform.":[264]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
