{"id":"https://openalex.org/W2041626001","doi":"https://doi.org/10.1109/tcst.2014.2322778","title":"Adaptive Suboptimal Output-Feedback Control for Linear Systems Using Integral Reinforcement Learning","display_name":"Adaptive Suboptimal Output-Feedback Control for Linear Systems Using Integral Reinforcement Learning","publication_year":2014,"publication_date":"2014-06-03","ids":{"openalex":"https://openalex.org/W2041626001","doi":"https://doi.org/10.1109/tcst.2014.2322778","mag":"2041626001"},"language":"en","primary_location":{"id":"doi:10.1109/tcst.2014.2322778","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcst.2014.2322778","pdf_url":null,"source":{"id":"https://openalex.org/S133363738","display_name":"IEEE Transactions on Control Systems Technology","issn_l":"1063-6536","issn":["1063-6536","1558-0865","2374-0159"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control Systems Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050679356","display_name":"Lemei M. Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I132210918","display_name":"North China Institute of Science and Technology","ror":"https://ror.org/0096c7651","country_code":"CN","type":"education","lineage":["https://openalex.org/I132210918"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lemei M. Zhu","raw_affiliation_strings":["Department of Basic, North China Institute of Science and Technology, Hebei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Basic, North China Institute of Science and Technology, Hebei, China","institution_ids":["https://openalex.org/I132210918"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063118155","display_name":"Hamidreza Modares","orcid":"https://orcid.org/0000-0003-0800-5140"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hamidreza Modares","raw_affiliation_strings":["Arlington Research Institute, University of Texas, Fort Worth, TX, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Arlington Research Institute, University of Texas, Fort Worth, TX, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010829346","display_name":"Gan Oon Peen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091207","display_name":"Singapore Institute of Manufacturing Technology","ror":"https://ror.org/00f44np30","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I4210091207","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Gan Oon Peen","raw_affiliation_strings":["Singapore Institute of Manufacturing Technology, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Singapore Institute of Manufacturing Technology, Singapore","institution_ids":["https://openalex.org/I4210091207"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016137188","display_name":"Frank L. Lewis","orcid":"https://orcid.org/0000-0003-4074-1615"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Frank L. Lewis","raw_affiliation_strings":["Arlington Research Institute, University of Texas, Fort Worth, TX, USA","State Key Laboratory of Synthetical Process Automation, Northeastern University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Arlington Research Institute, University of Texas, Fort Worth, TX, USA","institution_ids":[]},{"raw_affiliation_string":"State Key Laboratory of Synthetical Process Automation, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101580741","display_name":"Baozeng Yue","orcid":"https://orcid.org/0000-0003-0448-915X"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baozeng Yue","raw_affiliation_strings":["Department of Mechanics, Beijing Institute of Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mechanics, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5050679356"],"corresponding_institution_ids":["https://openalex.org/I132210918"],"apc_list":null,"apc_paid":null,"fwci":3.6703,"has_fulltext":false,"cited_by_count":100,"citation_normalized_percentile":{"value":0.93090548,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"23","issue":"1","first_page":"264","last_page":"273"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.9696000218391418,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10675","display_name":"Mechanical Circulatory Support Devices","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7941102981567383},{"id":"https://openalex.org/keywords/observer","display_name":"Observer (physics)","score":0.6873422861099243},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.6618157625198364},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6570920348167419},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6317227482795715},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5520810484886169},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4968254864215851},{"id":"https://openalex.org/keywords/output-feedback","display_name":"Output feedback","score":0.47671929001808167},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.45795002579689026},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.41636529564857483},{"id":"https://openalex.org/keywords/adaptive-control","display_name":"Adaptive control","score":0.410581111907959},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18066036701202393}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7941102981567383},{"id":"https://openalex.org/C2780704645","wikidata":"https://www.wikidata.org/wiki/Q9251458","display_name":"Observer (physics)","level":2,"score":0.6873422861099243},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.6618157625198364},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6570920348167419},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6317227482795715},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5520810484886169},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4968254864215851},{"id":"https://openalex.org/C3018623182","wikidata":"https://www.wikidata.org/wiki/Q154021","display_name":"Output feedback","level":3,"score":0.47671929001808167},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.45795002579689026},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.41636529564857483},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.410581111907959},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18066036701202393},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcst.2014.2322778","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcst.2014.2322778","pdf_url":null,"source":{"id":"https://openalex.org/S133363738","display_name":"IEEE Transactions on Control Systems Technology","issn_l":"1063-6536","issn":["1063-6536","1558-0865","2374-0159"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control Systems Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2193311593","display_name":null,"funder_award_id":"ECCS-1128050","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5188019245","display_name":null,"funder_award_id":"IIS-1208623","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6900036684","display_name":null,"funder_award_id":"61120106011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G836722894","display_name":null,"funder_award_id":"N00014-13-1-0562","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W601351931","https://openalex.org/W1510580798","https://openalex.org/W1616818660","https://openalex.org/W1907796993","https://openalex.org/W1972243698","https://openalex.org/W1983523797","https://openalex.org/W2013895638","https://openalex.org/W2014729048","https://openalex.org/W2017570421","https://openalex.org/W2019478222","https://openalex.org/W2024303516","https://openalex.org/W2037025184","https://openalex.org/W2037539475","https://openalex.org/W2048687352","https://openalex.org/W2050838777","https://openalex.org/W2057491769","https://openalex.org/W2060605484","https://openalex.org/W2071004621","https://openalex.org/W2081514674","https://openalex.org/W2085194340","https://openalex.org/W2087063454","https://openalex.org/W2124829859","https://openalex.org/W2137547645","https://openalex.org/W2138718561","https://openalex.org/W2148439597","https://openalex.org/W2151966330","https://openalex.org/W2152161277","https://openalex.org/W2165501837","https://openalex.org/W2167322332","https://openalex.org/W2321292752","https://openalex.org/W2484646121","https://openalex.org/W2487144912","https://openalex.org/W3011120880","https://openalex.org/W3213472335","https://openalex.org/W4214717370","https://openalex.org/W6775686901","https://openalex.org/W6804409665"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W1965722305","https://openalex.org/W1991810297","https://openalex.org/W2032253950","https://openalex.org/W1819950161","https://openalex.org/W4200410877"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,45,142],"(RL)":[2],"techniques":[3],"have":[4],"been":[5],"successfully":[6],"used":[7,118],"to":[8,27,36,54,82,119,152],"find":[9,55],"optimal":[10],"state-feedback":[11],"controllers":[12],"for":[13,60,127],"continuous-time":[14],"(CT)":[15],"systems.":[16,65],"However,":[17,134],"in":[18,75,79],"most":[19],"real-world":[20,170],"control":[21],"applications,":[22,171],"it":[23,33],"is":[24,34,107,117,137,144],"not":[25,108,138],"practical":[26],"measure":[28],"the":[29,49,89,93,97,103,111,121,124,128,135,141,149,158,161,173,177],"system":[30,104],"states":[31,126],"and":[32,87,157,176],"desirable":[35],"design":[37],"output-feedback":[38,58,85,90,155],"controllers.":[39],"This":[40],"paper":[41],"develops":[42],"an":[43,71,84],"online":[44,78],"algorithm":[46,69,151],"based":[47],"on":[48,168],"integral":[50],"RL":[51],"(IRL)":[52],"technique":[53],"a":[56,153],"suboptimal":[57,154],"controller":[59],"partially":[61],"unknown":[62],"CT":[63],"linear":[64],"The":[66,100,146],"proposed":[67,112,150,162],"IRL-based":[68],"solves":[70],"IRL":[72,129],"Bellman":[73,130],"equation":[74,131],"each":[76],"iteration":[77],"real":[80],"time":[81],"evaluate":[83],"policy":[86],"updates":[88],"gain":[91],"using":[92],"information":[94],"given":[95],"by":[96,110],"evaluated":[98],"policy.":[99],"knowledge":[101,122],"of":[102,123,148,160],"drift":[105],"dynamics":[106],"required":[109],"method.":[113],"An":[114],"adaptive":[115],"observer":[116,136],"provide":[120],"full":[125],"during":[132],"learning.":[133],"needed":[139],"after":[140],"process":[143],"finished.":[145],"convergence":[147],"solution":[156],"performance":[159],"method":[163],"are":[164],"verified":[165],"through":[166],"simulation":[167],"two":[169],"namely,":[172],"X-Y":[174],"table":[175],"F-16":[178],"aircraft.":[179]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":15},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":5}],"updated_date":"2026-05-14T08:36:36.166977","created_date":"2025-10-10T00:00:00"}
