{"id":"https://openalex.org/W7123343226","doi":"https://doi.org/10.1109/tsmc.2025.3649181","title":"Reinforcement Learning Optimal Output Feedback Control for Takagi\u2013Sugeno Fuzzy Systems With Disturbances","display_name":"Reinforcement Learning Optimal Output Feedback Control for Takagi\u2013Sugeno Fuzzy Systems With Disturbances","publication_year":2026,"publication_date":"2026-01-12","ids":{"openalex":"https://openalex.org/W7123343226","doi":"https://doi.org/10.1109/tsmc.2025.3649181"},"language":null,"primary_location":{"id":"doi:10.1109/tsmc.2025.3649181","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2025.3649181","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122861130","display_name":"Yifan Deng","orcid":null},"institutions":[{"id":"https://openalex.org/I2898894","display_name":"Liaoning University of Technology","ror":"https://ror.org/05ay23762","country_code":"CN","type":"education","lineage":["https://openalex.org/I2898894"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifan Deng","raw_affiliation_strings":["College of Science, Liaoning University of Technology, Jinzhou, China"],"raw_orcid":"https://orcid.org/0009-0004-6360-0019","affiliations":[{"raw_affiliation_string":"College of Science, Liaoning University of Technology, Jinzhou, China","institution_ids":["https://openalex.org/I2898894"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082246866","display_name":"Wenting Song","orcid":"https://orcid.org/0000-0001-9521-4746"},"institutions":[{"id":"https://openalex.org/I2898894","display_name":"Liaoning University of Technology","ror":"https://ror.org/05ay23762","country_code":"CN","type":"education","lineage":["https://openalex.org/I2898894"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenting Song","raw_affiliation_strings":["College of Science, Liaoning University of Technology, Jinzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-9521-4746","affiliations":[{"raw_affiliation_string":"College of Science, Liaoning University of Technology, Jinzhou, China","institution_ids":["https://openalex.org/I2898894"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114214539","display_name":"Shaocheng Tong","orcid":"https://orcid.org/0000-0002-7366-7805"},"institutions":[{"id":"https://openalex.org/I2898894","display_name":"Liaoning University of Technology","ror":"https://ror.org/05ay23762","country_code":"CN","type":"education","lineage":["https://openalex.org/I2898894"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaocheng Tong","raw_affiliation_strings":["College of Science, Liaoning University of Technology, Jinzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-7366-7805","affiliations":[{"raw_affiliation_string":"College of Science, Liaoning University of Technology, Jinzhou, China","institution_ids":["https://openalex.org/I2898894"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08074504,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"56","issue":"4","first_page":"2297","last_page":"2307"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9467999935150146,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9467999935150146,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12277","display_name":"Frequency Control in Power Systems","score":0.006800000090152025,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.005799999926239252,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.8123999834060669},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.5978999733924866},{"id":"https://openalex.org/keywords/fuzzy-control-system","display_name":"Fuzzy control system","score":0.5527999997138977},{"id":"https://openalex.org/keywords/fuzzy-logic","display_name":"Fuzzy logic","score":0.5422999858856201},{"id":"https://openalex.org/keywords/observer","display_name":"Observer (physics)","score":0.5400999784469604},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5388000011444092},{"id":"https://openalex.org/keywords/differential-game","display_name":"Differential game","score":0.47530001401901245},{"id":"https://openalex.org/keywords/output-feedback","display_name":"Output feedback","score":0.4487000107765198},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4262000024318695}],"concepts":[{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.8123999834060669},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.5978999733924866},{"id":"https://openalex.org/C195975749","wikidata":"https://www.wikidata.org/wiki/Q1475705","display_name":"Fuzzy control system","level":3,"score":0.5527999997138977},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.5422999858856201},{"id":"https://openalex.org/C2780704645","wikidata":"https://www.wikidata.org/wiki/Q9251458","display_name":"Observer (physics)","level":2,"score":0.5400999784469604},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5388000011444092},{"id":"https://openalex.org/C2779006483","wikidata":"https://www.wikidata.org/wiki/Q1973196","display_name":"Differential game","level":2,"score":0.47530001401901245},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47189998626708984},{"id":"https://openalex.org/C3018623182","wikidata":"https://www.wikidata.org/wiki/Q154021","display_name":"Output feedback","level":3,"score":0.4487000107765198},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4262000024318695},{"id":"https://openalex.org/C13847129","wikidata":"https://www.wikidata.org/wiki/Q4723989","display_name":"Algebraic Riccati equation","level":4,"score":0.42149999737739563},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4101000130176544},{"id":"https://openalex.org/C45473103","wikidata":"https://www.wikidata.org/wiki/Q851503","display_name":"Riccati equation","level":3,"score":0.3779999911785126},{"id":"https://openalex.org/C98779006","wikidata":"https://www.wikidata.org/wiki/Q2520550","display_name":"Linear-quadratic regulator","level":3,"score":0.37450000643730164},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.36039999127388},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3571000099182129},{"id":"https://openalex.org/C9376300","wikidata":"https://www.wikidata.org/wiki/Q168817","display_name":"Algebraic number","level":2,"score":0.3422999978065491},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.32899999618530273},{"id":"https://openalex.org/C204495892","wikidata":"https://www.wikidata.org/wiki/Q1798304","display_name":"Linear-quadratic-Gaussian control","level":3,"score":0.31610000133514404},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C93226319","wikidata":"https://www.wikidata.org/wiki/Q193137","display_name":"Differential (mechanical device)","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C184652730","wikidata":"https://www.wikidata.org/wiki/Q2357982","display_name":"Attenuation","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2547999918460846}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2025.3649181","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2025.3649181","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G37309136","display_name":null,"funder_award_id":"62173172","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7655133018","display_name":null,"funder_award_id":"62573216","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1967793246","https://openalex.org/W1989555277","https://openalex.org/W1998361253","https://openalex.org/W2055891887","https://openalex.org/W2139416664","https://openalex.org/W2148885430","https://openalex.org/W2570103416","https://openalex.org/W2767307332","https://openalex.org/W2897702175","https://openalex.org/W2907944110","https://openalex.org/W2914172002","https://openalex.org/W2917322258","https://openalex.org/W3091794548","https://openalex.org/W3127008750","https://openalex.org/W3172934943","https://openalex.org/W3205613298","https://openalex.org/W4206037914","https://openalex.org/W4210687955","https://openalex.org/W4310329823","https://openalex.org/W4361852720","https://openalex.org/W4364856517","https://openalex.org/W4383113468","https://openalex.org/W4386523235","https://openalex.org/W4391341148","https://openalex.org/W4392504543","https://openalex.org/W4397026485","https://openalex.org/W4398226372","https://openalex.org/W4403123655","https://openalex.org/W4403209848","https://openalex.org/W4406117312","https://openalex.org/W4406610537","https://openalex.org/W4408711313"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"article,":[2],"we":[3,125],"study":[4],"the":[5,32,39,58,95,101,112,120,127,137,141,144],"reinforcement":[6],"learning":[7,87],"(RL)":[8],"optimal":[9,44,60,105,129],"output":[10,45,81,106],"feedback":[11,46,82,107],"control":[12,47,61,108,130],"problem":[13],"for":[14],"Takagi\u2013Sugeno":[15],"(T\u2013S)":[16],"fuzzy":[17,25,43,103],"systems":[18,114],"with":[19],"immeasurable":[20,33],"states":[21],"and":[22,35,100,118,136],"disturbances.":[23],"A":[24],"filtering":[26,40],"observer":[27],"is":[28,49,73,89,92,98],"designed":[29],"to":[30,65,75,132],"estimate":[31],"states,":[34],"then,":[36],"based":[37],"on":[38],"observer,":[41],"a":[42,133],"method":[48,131],"presented":[50],"by":[51],"employing":[52],"zero-sum":[53],"differential":[54],"game":[55,67],"theory.":[56],"Since":[57],"analytical":[59,78],"solutions":[62],"are":[63],"reduced":[64],"solving":[66],"algebraic":[68],"Riccati":[69],"equations":[70],"(GAREs),":[71],"which":[72],"difficult":[74],"obtain":[76],"their":[77],"solutions,":[79],"an":[80],"model-free":[83],"policy":[84],"iteration":[85],"(PI)":[86],"algorithm":[88,97],"proposed.":[90],"It":[91],"proved":[93],"that":[94],"proposed":[96,102],"convergent":[99],"RL":[104],"approach":[109],"can":[110],"make":[111],"controlled":[113],"be":[115],"asymptotically":[116],"stable":[117],"satisfy":[119],"disturbance":[121],"attenuation":[122],"condition.":[123],"Finally,":[124],"apply":[126],"developed":[128,145],"mass\u2013spring\u2013damper":[134],"system,":[135],"simulation":[138],"results":[139],"verify":[140],"effectiveness":[142],"of":[143],"method.":[146]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-01-14T00:00:00"}
