{"id":"https://openalex.org/W4402350252","doi":"https://doi.org/10.1109/tase.2024.3453926","title":"Adaptive Critic Control With Knowledge Transfer for Uncertain Nonlinear Dynamical Systems: A Reinforcement Learning Approach","display_name":"Adaptive Critic Control With Knowledge Transfer for Uncertain Nonlinear Dynamical Systems: A Reinforcement Learning Approach","publication_year":2024,"publication_date":"2024-09-09","ids":{"openalex":"https://openalex.org/W4402350252","doi":"https://doi.org/10.1109/tase.2024.3453926"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2024.3453926","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3453926","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090452583","display_name":"Zhang Liangju","orcid":"https://orcid.org/0009-0001-7252-6656"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liangju Zhang","raw_affiliation_strings":["College of Automatic and the College of Artificial Intelligence, Nanjing University of Posts and Telecommunications, Nanjing, Jiangsu, China"],"affiliations":[{"raw_affiliation_string":"College of Automatic and the College of Artificial Intelligence, Nanjing University of Posts and Telecommunications, Nanjing, Jiangsu, China","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100342397","display_name":"Kun Zhang","orcid":"https://orcid.org/0009-0008-9929-7700"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Zhang","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113373529","display_name":"Xiang Peng Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiang Peng Xie","raw_affiliation_strings":["School of Internet of Things, Nanjing University of Posts and Telecommunications, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Internet of Things, Nanjing University of Posts and Telecommunications, Nanjing, China","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013750149","display_name":"Mohammed Chadli","orcid":"https://orcid.org/0000-0002-0140-5187"},"institutions":[{"id":"https://openalex.org/I4210107733","display_name":"Informatique, Biologie Int\u00e9grative et Syst\u00e8mes Complexes","ror":"https://ror.org/01aqxgr98","country_code":"FR","type":"facility","lineage":["https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210107733","https://openalex.org/I88467170"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Mohammed Chadli","raw_affiliation_strings":["IBISC Laboratory, University of Paris-Saclay, &#x00C9;vry, France"],"affiliations":[{"raw_affiliation_string":"IBISC Laboratory, University of Paris-Saclay, &#x00C9;vry, France","institution_ids":["https://openalex.org/I4210107733","https://openalex.org/I277688954"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5090452583"],"corresponding_institution_ids":["https://openalex.org/I41198531"],"apc_list":null,"apc_paid":null,"fwci":1.5217,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.84492694,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"22","issue":null,"first_page":"6752","last_page":"6761"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9642999768257141,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9642999768257141,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.932200014591217,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6571833491325378},{"id":"https://openalex.org/keywords/adaptive-control","display_name":"Adaptive control","score":0.6479827165603638},{"id":"https://openalex.org/keywords/nonlinear-dynamical-systems","display_name":"Nonlinear dynamical systems","score":0.6214933395385742},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.573920488357544},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5691147446632385},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5002572536468506},{"id":"https://openalex.org/keywords/dynamical-systems-theory","display_name":"Dynamical systems theory","score":0.4980776309967041},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4514637291431427},{"id":"https://openalex.org/keywords/transfer-function","display_name":"Transfer function","score":0.4228639602661133},{"id":"https://openalex.org/keywords/control-system","display_name":"Control system","score":0.41829633712768555},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3996187448501587},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3844365179538727},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.28453272581100464},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.13604065775871277}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6571833491325378},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.6479827165603638},{"id":"https://openalex.org/C2983030100","wikidata":"https://www.wikidata.org/wiki/Q638328","display_name":"Nonlinear dynamical systems","level":3,"score":0.6214933395385742},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.573920488357544},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5691147446632385},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5002572536468506},{"id":"https://openalex.org/C79379906","wikidata":"https://www.wikidata.org/wiki/Q3174497","display_name":"Dynamical systems theory","level":2,"score":0.4980776309967041},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4514637291431427},{"id":"https://openalex.org/C81299745","wikidata":"https://www.wikidata.org/wiki/Q334269","display_name":"Transfer function","level":2,"score":0.4228639602661133},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.41829633712768555},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3996187448501587},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3844365179538727},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.28453272581100464},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.13604065775871277},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tase.2024.3453926","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3453926","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-04986152v1","is_oa":false,"landing_page_url":"https://hal.science/hal-04986152","pdf_url":null,"source":{"id":"https://openalex.org/S4406922466","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Transactions on Automation Science and Engineering, 2025, 22, pp.6752--6761. &#x27E8;10.1109/TASE.2024.3453926&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2680715701","display_name":null,"funder_award_id":"62103408","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3790867977","display_name":null,"funder_award_id":"62022044","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7261126740","display_name":null,"funder_award_id":"62373196","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W173093232","https://openalex.org/W1493260514","https://openalex.org/W1983523797","https://openalex.org/W2007734734","https://openalex.org/W2018135576","https://openalex.org/W2033030672","https://openalex.org/W2048687352","https://openalex.org/W2050838777","https://openalex.org/W2073591687","https://openalex.org/W2093831009","https://openalex.org/W2108776232","https://openalex.org/W2110040537","https://openalex.org/W2165501837","https://openalex.org/W2188644438","https://openalex.org/W2189990206","https://openalex.org/W2333120204","https://openalex.org/W2343090116","https://openalex.org/W2603090782","https://openalex.org/W2614992370","https://openalex.org/W2918343027","https://openalex.org/W2943517418","https://openalex.org/W2955358943","https://openalex.org/W2982838649","https://openalex.org/W2995409103","https://openalex.org/W3000451313","https://openalex.org/W3002038967","https://openalex.org/W3011116059","https://openalex.org/W3114263192","https://openalex.org/W3119186746","https://openalex.org/W3200299012","https://openalex.org/W3206104399","https://openalex.org/W4210556448","https://openalex.org/W4226053079","https://openalex.org/W4226154450","https://openalex.org/W4280590612","https://openalex.org/W4285411788","https://openalex.org/W4313476622","https://openalex.org/W4323519271","https://openalex.org/W4377224182","https://openalex.org/W4383112908","https://openalex.org/W4385732480","https://openalex.org/W4386449193","https://openalex.org/W4388579564","https://openalex.org/W4388726079","https://openalex.org/W4390724347","https://openalex.org/W6689723076"],"related_works":["https://openalex.org/W2056626217","https://openalex.org/W1541871911","https://openalex.org/W2184005427","https://openalex.org/W3185784018","https://openalex.org/W3212383242","https://openalex.org/W2050258033","https://openalex.org/W2148316232","https://openalex.org/W2118381768","https://openalex.org/W2981998189","https://openalex.org/W2085372279"],"abstract_inverted_index":{"This":[0,54],"paper":[1,232],"presents":[2],"an":[3,196],"online":[4,63,221],"transfer":[5,23,75],"heuristic":[6],"dynamic":[7,149],"programming":[8,150],"(THDP)":[9],"control":[10,34,64,97,198,222],"approach":[11,21],"for":[12,36],"a":[13,31,47,83,88,94,173,179,186,208],"class":[14,209],"of":[15,66,69,108,123,142,154,176,182,188,210,223],"nonlinear":[16,38,67,111],"discrete":[17,39],"systems.":[18],"The":[19],"proposed":[20,144],"integrates":[22],"learning":[24,207],"with":[25,87,200],"adaptive":[26],"critic":[27],"control.":[28],"To":[29,72],"design":[30],"robust":[32,114],"optimal":[33,115],"strategy":[35],"the":[37,62,106,109,120,140,143,155,160,220,228],"systems,":[40],"we":[41,81,92,103,194],"utilize":[42],"sample":[43],"data":[44],"collected":[45],"from":[46],"source":[48],"task":[49],"to":[50,60,99,138,147,158,213,217],"acquire":[51],"prior":[52,55,215],"knowledge.":[53],"knowledge":[56,216],"is":[57,152],"subsequently":[58],"used":[59],"guide":[61],"process":[65],"systems":[68,112],"target":[70],"tasks.":[71],"avoid":[73],"negative":[74],"effects":[76],"and":[77,178,243],"conserve":[78],"computational":[79,183,189],"resources,":[80],"introduce":[82],"novel":[84],"attenuation":[85],"function":[86],"truncation":[89],"mechanism.":[90],"Additionally,":[91],"develop":[93],"disturbance":[95],"compensation":[96],"mechanism":[98],"address":[100],"uncertainties.":[101],"Furthermore,":[102],"demonstrate":[104],"that":[105,204,238,252],"properties":[107],"uncertain":[110],"under":[113],"control,":[116],"as":[117,119],"well":[118],"weight":[121],"error":[122],"neural":[124,167],"networks,":[125],"are":[126,136,240],"ultimately":[127],"uniformly":[128],"bounded":[129],"given":[130],"certain":[131],"conditions.":[132],"Finally,":[133],"two":[134],"simulations":[135],"conducted":[137],"verify":[139],"performance":[141],"algorithm.":[145],"Note":[146],"Practitioners\u2014Adaptive":[148],"(ADP)":[151],"one":[153],"main":[156],"methods":[157],"solve":[159],"Hamilton-Jacobi-Bellman":[161],"(HJB)":[162],"equation.":[163],"However,":[164],"when":[165],"using":[166],"network":[168],"approximation,":[169],"it":[170,248],"often":[171],"requires":[172],"long":[174],"time":[175],"iteration":[177],"large":[180],"amount":[181],"process,":[184],"wasting":[185],"lot":[187],"resources.":[190],"For":[191],"this":[192,231,253],"reason,":[193],"propose":[195],"ADP":[197],"scheme":[199,254],"enhanced":[201],"detection":[202],"speed:":[203],"is,":[205],"by":[206],"similar":[211],"tasks":[212],"obtain":[214],"assist":[218],"in":[219],"our":[224],"actual":[225],"system.":[226],"At":[227],"same":[229],"time,":[230],"considers":[233],"system":[234],"disturbances,":[235],"which":[236],"means":[237],"they":[239],"more":[241],"universal":[242],"robust.":[244],"After":[245],"simulation":[246],"experiments,":[247],"has":[249,255],"been":[250],"proven":[251],"good":[256],"performance.":[257]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
