{"id":"https://openalex.org/W4287845909","doi":"https://doi.org/10.1109/icca54724.2022.9831833","title":"Model-Assisted Reinforcement Learning for Online Diagnostics in Stochastic Controlled Systems","display_name":"Model-Assisted Reinforcement Learning for Online Diagnostics in Stochastic Controlled Systems","publication_year":2022,"publication_date":"2022-06-27","ids":{"openalex":"https://openalex.org/W4287845909","doi":"https://doi.org/10.1109/icca54724.2022.9831833"},"language":"en","primary_location":{"id":"doi:10.1109/icca54724.2022.9831833","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icca54724.2022.9831833","pdf_url":null,"source":{"id":"https://openalex.org/S4363608132","display_name":"2022 IEEE 17th International Conference on Control &amp; Automation (ICCA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 17th International Conference on Control &amp; Automation (ICCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051837539","display_name":"Erfaun Noorani","orcid":"https://orcid.org/0000-0002-5171-122X"},"institutions":[{"id":"https://openalex.org/I173498003","display_name":"Palo Alto Research Center","ror":"https://ror.org/0529fxt39","country_code":"US","type":"facility","lineage":["https://openalex.org/I173498003","https://openalex.org/I4210132870"]},{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Erfaun Noorani","raw_affiliation_strings":["A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","Department of Electrical and Computer Engineering, the Institute for System Research (ISR) at the University of Maryland College Park, College Park, MD, USA","Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","institution_ids":["https://openalex.org/I173498003"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, the Institute for System Research (ISR) at the University of Maryland College Park, College Park, MD, USA","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I173498003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080167889","display_name":"Christoforos Somarakis","orcid":"https://orcid.org/0000-0003-4601-2501"},"institutions":[{"id":"https://openalex.org/I173498003","display_name":"Palo Alto Research Center","ror":"https://ror.org/0529fxt39","country_code":"US","type":"facility","lineage":["https://openalex.org/I173498003","https://openalex.org/I4210132870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christoforos Somarakis","raw_affiliation_strings":["A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","institution_ids":["https://openalex.org/I173498003"]},{"raw_affiliation_string":"Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I173498003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072338368","display_name":"Raman Goyal","orcid":"https://orcid.org/0000-0002-8128-3051"},"institutions":[{"id":"https://openalex.org/I173498003","display_name":"Palo Alto Research Center","ror":"https://ror.org/0529fxt39","country_code":"US","type":"facility","lineage":["https://openalex.org/I173498003","https://openalex.org/I4210132870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Raman Goyal","raw_affiliation_strings":["A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","institution_ids":["https://openalex.org/I173498003"]},{"raw_affiliation_string":"Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I173498003"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109362391","display_name":"Alexander Feldman","orcid":null},"institutions":[{"id":"https://openalex.org/I173498003","display_name":"Palo Alto Research Center","ror":"https://ror.org/0529fxt39","country_code":"US","type":"facility","lineage":["https://openalex.org/I173498003","https://openalex.org/I4210132870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexander Feldman","raw_affiliation_strings":["A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","institution_ids":["https://openalex.org/I173498003"]},{"raw_affiliation_string":"Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I173498003"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035310261","display_name":"Shantanu Rane","orcid":"https://orcid.org/0009-0003-6319-1764"},"institutions":[{"id":"https://openalex.org/I173498003","display_name":"Palo Alto Research Center","ror":"https://ror.org/0529fxt39","country_code":"US","type":"facility","lineage":["https://openalex.org/I173498003","https://openalex.org/I4210132870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shantanu Rane","raw_affiliation_strings":["A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"A Xerox Company,Palo Alto Research Center,Palo Alto,CA,USA","institution_ids":["https://openalex.org/I173498003"]},{"raw_affiliation_string":"Palo Alto Research Center, A Xerox Company, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I173498003"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.07285168,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"338","last_page":"345"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9664999842643738,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9664999842643738,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9552000164985657,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/linear-quadratic-gaussian-control","display_name":"Linear-quadratic-Gaussian control","score":0.8620954155921936},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8251705169677734},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6957912445068359},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5163401365280151},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.4822319447994232},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.46664953231811523},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.42503461241722107},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4103849530220032},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2901070713996887},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.21373659372329712},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1761922538280487}],"concepts":[{"id":"https://openalex.org/C204495892","wikidata":"https://www.wikidata.org/wiki/Q1798304","display_name":"Linear-quadratic-Gaussian control","level":3,"score":0.8620954155921936},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8251705169677734},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6957912445068359},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5163401365280151},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.4822319447994232},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.46664953231811523},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.42503461241722107},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4103849530220032},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2901070713996887},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.21373659372329712},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1761922538280487},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icca54724.2022.9831833","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icca54724.2022.9831833","pdf_url":null,"source":{"id":"https://openalex.org/S4363608132","display_name":"2022 IEEE 17th International Conference on Control &amp; Automation (ICCA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 17th International Conference on Control &amp; Automation (ICCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W1999291921","https://openalex.org/W2107169685","https://openalex.org/W2115005925","https://openalex.org/W4245839115","https://openalex.org/W2111439273","https://openalex.org/W1998777431","https://openalex.org/W2101783086","https://openalex.org/W2037500647","https://openalex.org/W2466810109","https://openalex.org/W2000675896"],"abstract_inverted_index":{"A":[0],"mechanism":[1],"to":[2,21,57,67],"protect":[3],"a":[4,11,36,72,92,111,121],"controlled":[5,45,119],"system":[6,65],"in":[7,34,144,150,155],"the":[8,19,64,76,80,87,98,140,148],"event":[9],"of":[10,79,100,114],"priori":[12],"unknown":[13,59],"abnormalities":[14],"(e.g.":[15],"faults,":[16],"attacks)":[17],"is":[18,142],"key":[20],"designing":[22],"resilient":[23],"and":[24,54,70,146],"robust":[25],"control":[26,31],"systems.":[27],"We":[28,62,83],"explore":[29],"bi-level":[30],"design":[32,73],"architectures":[33],"which":[35],"supervisory":[37],"Reinforcement":[38],"Learning":[39],"(RL)":[40],"agent":[41,49],"augments":[42],"an":[43,115,156],"over-observed":[44,116],"system.":[46],"The":[47],"RL":[48,81],"monitors":[50],"sensor":[51,60,103],"signals,":[52],"detects":[53],"takes":[55],"action":[56],"mitigate":[58],"faults.":[61,104],"use":[63],"dynamics":[66],"extract":[68],"features":[69],"develop":[71],"method":[74],"for":[75],"cost":[77,89],"function":[78,90],"module.":[82],"theoretically":[84],"show":[85,138],"that":[86,96,139],"designed":[88],"has":[91],"unique":[93],"optimal":[94],"policy":[95],"enables":[97],"diagnosis":[99],"arbitrary":[101],"constant":[102],"To":[105],"conceptualize":[106],"our":[107,135],"architecture,":[108],"we":[109],"consider":[110],"linear":[112],"version":[113],"chemical":[117],"process,":[118],"by":[120],"Linear":[122],"Quadratic":[123],"Gaussian":[124],"(LQG)":[125],"Servo-Controller":[126],"with":[127,134],"Integral":[128],"Action.":[129],"Our":[130],"experimental":[131],"results,":[132],"coupled":[133],"theoretical":[136],"analysis,":[137],"RL-agent":[141],"successful":[143],"identifying":[145],"mitigating":[147],"faults":[149],"one":[151],"or":[152],"more":[153],"sensors":[154],"online":[157],"fashion.":[158]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
