{"id":"https://openalex.org/W2589031991","doi":"https://doi.org/10.1109/ssci.2016.7849841","title":"Iterative Q-learning-based nonlinear optimal tracking control","display_name":"Iterative Q-learning-based nonlinear optimal tracking control","publication_year":2016,"publication_date":"2016-12-01","ids":{"openalex":"https://openalex.org/W2589031991","doi":"https://doi.org/10.1109/ssci.2016.7849841","mag":"2589031991"},"language":"en","primary_location":{"id":"doi:10.1109/ssci.2016.7849841","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci.2016.7849841","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087825639","display_name":"Qinglai Wei","orcid":"https://orcid.org/0000-0001-7002-9800"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qinglai Wei","raw_affiliation_strings":["The State Key Laboratory of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","The State Key Laboratory of Management and Control for Complex Systems, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]},{"raw_affiliation_string":"The State Key Laboratory of Management and Control for Complex Systems, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040323322","display_name":"Ruizhuo Song","orcid":"https://orcid.org/0000-0002-6693-2738"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruizhuo Song","raw_affiliation_strings":["School of Automation and Electrical Engineering, University of Science and Technology Beijing, 100083, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, 100083, China","institution_ids":["https://openalex.org/I92403157"]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100981585","display_name":"Yancai Xu","orcid":"https://orcid.org/0000-0002-6953-0670"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yancai Xu","raw_affiliation_strings":["The State Key Laboratory of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","The State Key Laboratory of Management and Control for Complex Systems, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Management and Control for Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]},{"raw_affiliation_string":"The State Key Laboratory of Management and Control for Complex Systems, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004057129","display_name":"Derong Liu","orcid":"https://orcid.org/0000-0003-3715-4778"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Derong Liu","raw_affiliation_strings":["School of Automation and Electrical Engineering, University of Science and Technology Beijing, 100083, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, 100083, China","institution_ids":["https://openalex.org/I92403157"]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5087825639"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210094879"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.17942209,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2016","issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9550999999046326,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/iterative-learning-control","display_name":"Iterative learning control","score":0.910239577293396},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.7297976016998291},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.6943639516830444},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.6093611717224121},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.5628249645233154},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5488345623016357},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5454027652740479},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4556879699230194},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.44972965121269226},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.44285085797309875},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.39524200558662415},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3491000831127167},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.336127370595932},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.17763623595237732}],"concepts":[{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.910239577293396},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.7297976016998291},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.6943639516830444},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.6093611717224121},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.5628249645233154},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5488345623016357},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5454027652740479},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4556879699230194},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.44972965121269226},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.44285085797309875},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.39524200558662415},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3491000831127167},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.336127370595932},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.17763623595237732},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ssci.2016.7849841","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci.2016.7849841","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},{"id":"mag:2789320897","is_oa":false,"landing_page_url":"http://jglobal.jst.go.jp/en/public/20090422/201702223354496834","pdf_url":null,"source":{"id":"https://openalex.org/S4306512817","display_name":"IEEE Conference Proceedings","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Conference Proceedings","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.7799999713897705}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W92805021","https://openalex.org/W639062186","https://openalex.org/W1968908471","https://openalex.org/W1983089547","https://openalex.org/W1986864433","https://openalex.org/W1991119064","https://openalex.org/W1997603681","https://openalex.org/W1999213690","https://openalex.org/W2010152647","https://openalex.org/W2011310556","https://openalex.org/W2019338681","https://openalex.org/W2041866840","https://openalex.org/W2045719273","https://openalex.org/W2048687352","https://openalex.org/W2060686658","https://openalex.org/W2093831009","https://openalex.org/W2097569048","https://openalex.org/W2100276679","https://openalex.org/W2142620596","https://openalex.org/W2152161277","https://openalex.org/W2156629001","https://openalex.org/W2160561608","https://openalex.org/W2189990206","https://openalex.org/W2245501338","https://openalex.org/W2249513906","https://openalex.org/W2329769476","https://openalex.org/W2415286101","https://openalex.org/W2490234001","https://openalex.org/W2501330048","https://openalex.org/W2963609304","https://openalex.org/W3011120880","https://openalex.org/W4205326910","https://openalex.org/W6648026111"],"related_works":["https://openalex.org/W4386994694","https://openalex.org/W4388738109","https://openalex.org/W2362901947","https://openalex.org/W2362086884","https://openalex.org/W1606071314","https://openalex.org/W2350210972","https://openalex.org/W2369126164","https://openalex.org/W1482785882","https://openalex.org/W2376218423","https://openalex.org/W2761624296"],"abstract_inverted_index":{"A":[0],"new":[1,45],"Q-learning":[2,46],"algorithm":[3,47],"is":[4,31,48],"developed":[5,49,90],"for":[6,40],"a":[7],"class":[8],"of":[9,59,67,87],"discrete-time":[10],"nonlinear":[11],"systems":[12],"in":[13,50],"this":[14],"paper":[15],"to":[16,33,52,83],"solve":[17],"the":[18,27,41,44,54,60,65,68,75,85,88],"infinite":[19],"horizon":[20],"optimal":[21,28,36,55],"tracking":[22,29],"problems.":[23],"Using":[24],"system":[25],"transformations,":[26],"problem":[30],"transformed":[32],"be":[34],"an":[35],"regulation":[37,42],"problem.":[38],"Thereafter,":[39],"system,":[43],"order":[51],"obtain":[53],"control":[56,70],"law.":[57],"Convergence":[58],"iterative":[61,69],"Q":[62],"functions":[63],"and":[64],"admissibility":[66],"law":[71],"are":[72,81],"analyzed.":[73],"In":[74],"end,":[76],"two":[77],"corresponding":[78],"simulation":[79],"examples":[80],"presented":[82],"illustrate":[84],"performance":[86],"newly":[89],"algorithm.":[91]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
