{"id":"https://openalex.org/W4402568251","doi":"https://doi.org/10.1109/tase.2024.3456239","title":"Synthesis of Opacity-Enforcing Supervisory Strategies Using Reinforcement Learning","display_name":"Synthesis of Opacity-Enforcing Supervisory Strategies Using Reinforcement Learning","publication_year":2024,"publication_date":"2024-09-17","ids":{"openalex":"https://openalex.org/W4402568251","doi":"https://doi.org/10.1109/tase.2024.3456239"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2024.3456239","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3456239","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100724839","display_name":"Huimin Zhang","orcid":"https://orcid.org/0000-0001-5692-346X"},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Huimin Zhang","raw_affiliation_strings":["Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063035156","display_name":"Li Huang","orcid":"https://orcid.org/0000-0002-8454-9839"},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Huang","raw_affiliation_strings":["Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112280690","display_name":"Wanling Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wanling Huang","raw_affiliation_strings":["Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054955661","display_name":"Lei Feng","orcid":"https://orcid.org/0000-0001-5703-5923"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Lei Feng","raw_affiliation_strings":["Department of Machine Design, KTH Royal Institute of Technology, Stockholm, Sweden"],"affiliations":[{"raw_affiliation_string":"Department of Machine Design, KTH Royal Institute of Technology, Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037037839","display_name":"Xianxian Li","orcid":"https://orcid.org/0000-0002-7083-3847"},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianxian Li","raw_affiliation_strings":["Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Education Blockchain and Intelligent Technology, Ministry of Education, and Guangxi Key Laboratory of Multi-Source Information Mining and Security, Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100724839"],"corresponding_institution_ids":["https://openalex.org/I29739308"],"apc_list":null,"apc_paid":null,"fwci":0.7,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.69418711,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"22","issue":null,"first_page":"6896","last_page":"6906"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.3528999984264374,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.3528999984264374,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/supervisory-control","display_name":"Supervisory control","score":0.7622803449630737},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6065828800201416},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.505540132522583},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4583016037940979},{"id":"https://openalex.org/keywords/opacity","display_name":"Opacity","score":0.4562564492225647},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.44281813502311707},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3415754437446594},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.32964181900024414},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.2585957646369934},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.14418485760688782}],"concepts":[{"id":"https://openalex.org/C92991967","wikidata":"https://www.wikidata.org/wiki/Q7644329","display_name":"Supervisory control","level":3,"score":0.7622803449630737},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6065828800201416},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.505540132522583},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4583016037940979},{"id":"https://openalex.org/C60056205","wikidata":"https://www.wikidata.org/wiki/Q691914","display_name":"Opacity","level":2,"score":0.4562564492225647},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.44281813502311707},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3415754437446594},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.32964181900024414},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2585957646369934},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.14418485760688782},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2024.3456239","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3456239","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4248438916","display_name":null,"funder_award_id":"62103114","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G500372149","display_name":null,"funder_award_id":"U21A20474","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1502177156","https://openalex.org/W1505804150","https://openalex.org/W1562284768","https://openalex.org/W1575632017","https://openalex.org/W2064886960","https://openalex.org/W2090821252","https://openalex.org/W2101008541","https://openalex.org/W2125612430","https://openalex.org/W2126295866","https://openalex.org/W2145339207","https://openalex.org/W2162000948","https://openalex.org/W2163119090","https://openalex.org/W2440113315","https://openalex.org/W2509841691","https://openalex.org/W2768035641","https://openalex.org/W2912987268","https://openalex.org/W3011778292","https://openalex.org/W3035268587","https://openalex.org/W3112467125","https://openalex.org/W3185247296","https://openalex.org/W3207178583","https://openalex.org/W3214913876","https://openalex.org/W4288853474","https://openalex.org/W4312717216","https://openalex.org/W4320915023","https://openalex.org/W6780559895"],"related_works":["https://openalex.org/W2161791806","https://openalex.org/W2073474947","https://openalex.org/W4366824690","https://openalex.org/W2613656770","https://openalex.org/W2482431380","https://openalex.org/W2082077321","https://openalex.org/W2053059436","https://openalex.org/W128397461","https://openalex.org/W2159706408","https://openalex.org/W2613820654"],"abstract_inverted_index":{"In":[0,375],"the":[1,27,32,45,48,52,60,63,76,80,90,121,127,132,138,142,153,162,165,190,193,196,211,280,292,301,305,314,339,345,349,359,367,376,379,382,387,402,409,426],"control":[2,19,77,295,420],"of":[3,26,51,59,79,99,111,126,164,189,195,255,260,282,286,294,316,381,389],"discrete-event":[4],"systems":[5,261],"for":[6,41,176,218,248,273,358,422],"current-state":[7,249],"opacity":[8,42,177,221,250,357,423],"enforcement,":[9],"it":[10],"is":[11,54,65,85,92,129,150,179,336,363,405],"difficult":[12],"to":[13,37,75,87,119,130,160,228,237,323,355,365,398,415,418],"synthesize":[14,238],"a":[15,97,174,207,215,271,309],"supervisor":[16,175,274],"by":[17,136,181,252],"supervisory":[18,39,148,201],"theory":[20],"(SCT)":[21,232],"without":[22,184,203],"explicit":[23,186,245],"formal":[24,187,204,258,284],"models":[25,205,247,259,285],"systems.":[28,226,256,287],"This":[29,268,395],"study":[30],"utilizes":[31],"reinforcement":[33,277],"learning":[34,143,278],"(RL)":[35],"method":[36,198,272,290],"obtain":[38],"policies":[40,202,421],"enforcement":[43,178,222,251,424],"in":[44,62,141,199,210,220,223,279,297,304,369,425],"case":[46,281],"when":[47,152,401],"automaton":[49],"model":[50,188],"system":[53,69,105,246,340],"unavailable.":[55,267],"The":[56,109,124,168,288,318,334],"state":[57],"space":[58],"environment":[61],"RL":[64,182,325],"dynamically":[66],"generated":[67],"through":[68,308],"simulation.":[70],"Actions":[71],"are":[72,102,117,158,170,262],"defined":[73],"according":[74],"patterns":[78,296],"SCT.":[81],"A":[82],"reward":[83,135,310],"function":[84],"proposed":[86,122,166,197,289],"evaluate":[88],"whether":[89],"secret":[91],"exposed":[93],"or":[94,265],"not.":[95],"Then,":[96,145],"sequence":[98],"state-action-reward":[100],"chains":[101],"obtained":[103,151],"as":[104,328,338],"simulation":[106,341],"goes":[107,342],"on.":[108,343],"frameworks":[110,326],"Q-learning":[112,329,371],"and":[113,213,299,330,372,391],"State-Action-Reward-State-Action":[114,331],"(SARSA)":[115,332],"algorithms":[116],"adopted":[118],"implement":[120],"approach.":[123,167],"goal":[125],"training":[128,154,183,306,335,346],"maximize":[131],"total":[133],"accumulative":[134],"optimizing":[137],"action":[139,302],"selection":[140,303],"process.":[144],"an":[146,185,234],"optimal":[147,350],"policy":[149,351],"process":[155,307,347],"converges.":[156],"Experiments":[157],"performed":[159,337],"illustrate":[161],"effectiveness":[163],"contributions":[169],"two":[171],"aspects.":[172],"Firstly,":[173],"learned":[180],"system.":[191,360],"Secondly,":[192],"ability":[194],"computing":[200],"addresses":[206],"significant":[208],"gap":[209],"literature":[212],"offers":[214],"new":[216],"direction":[217],"research":[219],"discrete":[224],"event":[225],"Note":[227],"Practitioners\u2014Supervisory":[229],"Control":[230],"Theory":[231],"supplies":[233],"effective":[235],"way":[236],"supervisors,":[239],"which":[240],"traditionally":[241],"handles":[242],"tasks":[243],"with":[244,386],"restricting":[253],"behavior":[254],"However,":[257,361],"often":[263],"confidential":[264],"otherwise":[266],"paper":[269],"presents":[270],"synthesis":[275],"via":[276],"lacking":[283],"leverages":[291],"characteristics":[293],"SCT":[298],"optimizes":[300],"mechanism":[311],"that":[312],"evaluates":[313],"secrecy":[315],"states.":[317],"approach":[319,410],"can":[320,352,396],"be":[321,353],"applied":[322],"model-free":[324],"such":[327],"algorithms.":[333,374],"When":[344],"converges,":[348],"used":[354,364],"enforce":[356],"Q-table":[362,383],"save":[366],"Q-value":[368],"both":[370],"SARSA":[373],"worst":[377],"case,":[378],"size":[380],"grows":[384],"exponentially":[385],"number":[388],"states":[390],"controllable":[392],"events":[393],"increasing.":[394],"lead":[397],"memory":[399],"exhaustion":[400],"system\u2019s":[403],"scale":[404],"large.":[406],"To":[407],"make":[408],"scalable,":[411],"we":[412],"will":[413],"attempt":[414],"use":[416],"DRL":[417],"train":[419],"future.":[427]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
