{"id":"https://openalex.org/W4388579581","doi":"https://doi.org/10.1109/tsmc.2023.3327450","title":"Adaptive Dynamic Programming for Optimal Control of Discrete-Time Nonlinear Systems With Trajectory-Based Initial Control Policy","display_name":"Adaptive Dynamic Programming for Optimal Control of Discrete-Time Nonlinear Systems With Trajectory-Based Initial Control Policy","publication_year":2023,"publication_date":"2023-11-10","ids":{"openalex":"https://openalex.org/W4388579581","doi":"https://doi.org/10.1109/tsmc.2023.3327450"},"language":"en","primary_location":{"id":"doi:10.1109/tsmc.2023.3327450","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2023.3327450","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058905701","display_name":"Jiahui Xu","orcid":"https://orcid.org/0000-0002-4058-0447"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiahui Xu","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4058-0447","affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100777024","display_name":"Jingcheng Wang","orcid":"https://orcid.org/0000-0002-4277-1263"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingcheng Wang","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4277-1263","affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018604914","display_name":"Jun Rao","orcid":"https://orcid.org/0000-0002-7467-4898"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Rao","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-7467-4898","affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087893108","display_name":"Shunyu Wu","orcid":"https://orcid.org/0000-0001-9856-2148"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shunyu Wu","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-9856-2148","affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000872966","display_name":"Yanjiu Zhong","orcid":"https://orcid.org/0000-0002-4361-9378"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanjiu Zhong","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4361-9378","affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":1.1023,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.81638155,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"54","issue":"3","first_page":"1489","last_page":"1501"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.982200026512146,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10675","display_name":"Mechanical Circulatory Support Devices","score":0.9672999978065491,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.66135174036026},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.6108092069625854},{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.5881679058074951},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.577095091342926},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5581710338592529},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.5288482904434204},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5175082683563232},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5094276070594788},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.5004267692565918},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.46021807193756104},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4334830343723297},{"id":"https://openalex.org/keywords/discrete-time-and-continuous-time","display_name":"Discrete time and continuous time","score":0.42686280608177185},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.382876455783844},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.25113728642463684},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2033938467502594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19488295912742615},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13676020503044128}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.66135174036026},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.6108092069625854},{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.5881679058074951},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.577095091342926},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5581710338592529},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.5288482904434204},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5175082683563232},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5094276070594788},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.5004267692565918},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.46021807193756104},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4334830343723297},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.42686280608177185},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.382876455783844},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.25113728642463684},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2033938467502594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19488295912742615},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13676020503044128},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2023.3327450","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2023.3327450","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4341435642","display_name":null,"funder_award_id":"62273234","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1588906117","https://openalex.org/W1707845830","https://openalex.org/W2056653303","https://openalex.org/W2141559645","https://openalex.org/W2568019971","https://openalex.org/W2802164917","https://openalex.org/W2891122218","https://openalex.org/W2944481182","https://openalex.org/W2996785115","https://openalex.org/W3008245684","https://openalex.org/W3010946901","https://openalex.org/W3036186095","https://openalex.org/W3037622062","https://openalex.org/W3111327451","https://openalex.org/W3124981469","https://openalex.org/W3153251967","https://openalex.org/W3162945727","https://openalex.org/W3163501229","https://openalex.org/W3196262453","https://openalex.org/W3196755144","https://openalex.org/W3196924932","https://openalex.org/W3197308516","https://openalex.org/W4214717370","https://openalex.org/W4254041323","https://openalex.org/W4280607589","https://openalex.org/W4285411788","https://openalex.org/W4292086994","https://openalex.org/W6631190155","https://openalex.org/W6631943919","https://openalex.org/W6727685206","https://openalex.org/W6734122017","https://openalex.org/W6748839928","https://openalex.org/W6788186211"],"related_works":["https://openalex.org/W1932159282","https://openalex.org/W4285537323","https://openalex.org/W2379312070","https://openalex.org/W2136173754","https://openalex.org/W2110050003","https://openalex.org/W2953025626","https://openalex.org/W2499081552","https://openalex.org/W2366053282","https://openalex.org/W1653644965","https://openalex.org/W2602009922"],"abstract_inverted_index":{"The":[0,96,145,157],"policy":[1,81,126,132,149],"gradient":[2],"adaptive":[3],"dynamic":[4],"programming":[5],"(PGADP)":[6],"technique":[7],"has":[8,71],"gained":[9],"recognition":[10],"as":[11,69],"an":[12,77,122,170],"effective":[13],"approach":[14,204],"for":[15,164,230],"optimizing":[16],"the":[17,39,42,87,105,109,114,137,142,160,165,176,187,203,214,220],"performance":[18,229],"of":[19,31,44,89,108,159,186,216,222],"nonlinear":[20,94,115,198,231],"systems.":[21,95,232],"Nonetheless,":[22],"existing":[23],"PGADP":[24,138,207],"algorithms":[25,49],"often":[26],"demand":[27],"a":[28,64,101,181],"substantial":[29],"volume":[30],"expensive":[32],"or":[33],"potentially":[34],"risky":[35],"interaction":[36],"data":[37],"with":[38],"system.":[40],"Moreover,":[41],"utilization":[43],"neural":[45],"networks":[46],"in":[47,52,92,154,218],"these":[48,62],"can":[50,150],"result":[51],"suboptimal":[53],"learning":[54,178],"efficiency":[55],"and":[56,168,183,192,208,225],"unstable":[57],"training":[58],"procedures.":[59],"To":[60],"address":[61],"challenges,":[63],"novel":[65],"algorithm,":[66],"referred":[67],"to":[68,85,140,174],"OptNet-PGADP,":[70],"been":[72],"introduced.":[73],"This":[74,131],"algorithm":[75,98,139,161,188],"integrates":[76,169],"initially":[78],"tailored":[79],"control":[80,90,118,125,148,228],"based":[82],"on":[83,196],"OptNet":[84,163],"tackle":[86],"optimization":[88],"problems":[91],"discrete-time":[93],"OptNet-PGADP":[97,217],"operates":[99],"through":[100,129],"two-step":[102],"process.":[103],"Initially,":[104],"input\u2013output":[106],"trajectory":[107],"system":[110],"is":[111,127,133,189],"computed":[112],"using":[113,136],"model":[116],"predictive":[117],"(NMPC)":[119],"method.":[120],"Subsequently,":[121],"initial":[123],"admissible":[124],"acquired":[128],"OptNet.":[130],"iteratively":[134],"enhanced":[135],"attain":[141],"optimal":[143],"controller.":[144],"resulting":[146],"closed-loop":[147],"be":[151],"readily":[152],"deployed":[153],"real-time":[155],"applications.":[156],"implementation":[158],"employs":[162],"actor":[166],"network":[167],"experience":[171],"replay":[172],"mechanism":[173],"bolster":[175],"controller\u2019s":[177],"efficiency.":[179],"Furthermore,":[180],"convergence":[182],"optimality":[184],"analysis":[185],"included.":[190],"Simulation":[191],"experimental":[193],"results":[194],"conducted":[195],"two":[197],"systems":[199],"conclusively":[200],"demonstrate":[201],"that":[202],"outperforms":[205],"traditional":[206],"NMPC":[209],"algorithms.":[210],"These":[211],"findings":[212],"underscore":[213],"efficacy":[215],"mitigating":[219],"constraints":[221],"current":[223],"methods":[224],"achieving":[226],"superior":[227]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
