{"id":"https://openalex.org/W4312567063","doi":"https://doi.org/10.1109/tnnls.2022.3225090","title":"Policy-Iteration-Based Finite-Horizon Approximate Dynamic Programming for Continuous-Time Nonlinear Optimal Control","display_name":"Policy-Iteration-Based Finite-Horizon Approximate Dynamic Programming for Continuous-Time Nonlinear Optimal Control","publication_year":2022,"publication_date":"2022-12-05","ids":{"openalex":"https://openalex.org/W4312567063","doi":"https://doi.org/10.1109/tnnls.2022.3225090","pmid":"https://pubmed.ncbi.nlm.nih.gov/37015565"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2022.3225090","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3225090","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037283185","display_name":"Ziyu Lin","orcid":"https://orcid.org/0000-0003-0532-0030"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ziyu Lin","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0532-0030","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067909017","display_name":"Jingliang Duan","orcid":"https://orcid.org/0000-0002-3697-1576"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingliang Duan","raw_affiliation_strings":["School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3697-1576","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100747108","display_name":"Shengbo Eben Li","orcid":"https://orcid.org/0000-0003-4923-3633"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengbo Eben Li","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4923-3633","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004124678","display_name":"Haitong Ma","orcid":"https://orcid.org/0000-0002-9943-0638"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haitong Ma","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9943-0638","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100696317","display_name":"Jie Li","orcid":"https://orcid.org/0000-0002-3718-5593"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Li","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3718-5593","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072222039","display_name":"Jianyu Chen","orcid":"https://orcid.org/0000-0003-0282-8621"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianyu Chen","raw_affiliation_strings":["Institute for Interdisciplinary Information Sciences, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0282-8621","affiliations":[{"raw_affiliation_string":"Institute for Interdisciplinary Information Sciences, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102489731","display_name":"Bo Cheng","orcid":"https://orcid.org/0000-0001-8921-5857"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Cheng","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053340150","display_name":"Jun Ma","orcid":"https://orcid.org/0000-0002-9405-8232"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jun Ma","raw_affiliation_strings":["Robotics and Autonomous Systems Thrust, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","Department of Electronic and Computer Engineering, The Hong Kong University of Science and Technology, Hong Kong SAR, China"],"raw_orcid":"https://orcid.org/0000-0002-9405-8232","affiliations":[{"raw_affiliation_string":"Robotics and Autonomous Systems Thrust, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]},{"raw_affiliation_string":"Department of Electronic and Computer Engineering, The Hong Kong University of Science and Technology, Hong Kong SAR, China","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5037283185"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":2.7429,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.91647493,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"34","issue":"9","first_page":"5255","last_page":"5267"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10675","display_name":"Mechanical Circulatory Support Devices","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9751999974250793,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hamilton\u2013jacobi\u2013bellman-equation","display_name":"Hamilton\u2013Jacobi\u2013Bellman equation","score":0.9498330354690552},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.7417708039283752},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.6598119735717773},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.621330201625824},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5480709671974182},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5410020351409912},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.5312732458114624},{"id":"https://openalex.org/keywords/linear-quadratic-regulator","display_name":"Linear-quadratic regulator","score":0.48796290159225464},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.44421887397766113},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4436613917350769},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4327653646469116},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4127340316772461},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3316909074783325},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.19980919361114502},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.07370749115943909}],"concepts":[{"id":"https://openalex.org/C196978813","wikidata":"https://www.wikidata.org/wiki/Q3302775","display_name":"Hamilton\u2013Jacobi\u2013Bellman equation","level":3,"score":0.9498330354690552},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.7417708039283752},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.6598119735717773},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.621330201625824},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5480709671974182},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5410020351409912},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.5312732458114624},{"id":"https://openalex.org/C98779006","wikidata":"https://www.wikidata.org/wiki/Q2520550","display_name":"Linear-quadratic regulator","level":3,"score":0.48796290159225464},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.44421887397766113},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4436613917350769},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4327653646469116},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4127340316772461},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3316909074783325},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.19980919361114502},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.07370749115943909},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tnnls.2022.3225090","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3225090","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:37015565","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37015565","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-124375","is_oa":false,"landing_page_url":"http://gateway.isiknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcAuth=LinksAMR&SrcApp=PARTNER_APP&DestLinkType=FullRecord&DestApp=WOS&KeyUT=000912844100001","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G166390454","display_name":null,"funder_award_id":"U20A20334","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3945676288","display_name":null,"funder_award_id":"52202487","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G76702134","display_name":null,"funder_award_id":"51575293","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W1540245649","https://openalex.org/W1964565648","https://openalex.org/W1965512034","https://openalex.org/W1965640670","https://openalex.org/W1977671496","https://openalex.org/W1983523797","https://openalex.org/W1986611918","https://openalex.org/W2024303516","https://openalex.org/W2057484415","https://openalex.org/W2098432798","https://openalex.org/W2108286682","https://openalex.org/W2111752439","https://openalex.org/W2114424860","https://openalex.org/W2142620596","https://openalex.org/W2154868061","https://openalex.org/W2316022697","https://openalex.org/W2484646121","https://openalex.org/W2487144912","https://openalex.org/W2570494446","https://openalex.org/W2593476633","https://openalex.org/W2605603065","https://openalex.org/W2790434033","https://openalex.org/W2842089854","https://openalex.org/W2899748887","https://openalex.org/W2899790086","https://openalex.org/W2919115771","https://openalex.org/W2921905705","https://openalex.org/W2924607344","https://openalex.org/W2942684165","https://openalex.org/W2943141190","https://openalex.org/W2959078751","https://openalex.org/W2964043796","https://openalex.org/W2972670442","https://openalex.org/W3003788156","https://openalex.org/W3044587771","https://openalex.org/W3110685645","https://openalex.org/W3126145082","https://openalex.org/W3127275112","https://openalex.org/W3131282584","https://openalex.org/W3171595030","https://openalex.org/W3193478200","https://openalex.org/W3213472335","https://openalex.org/W4205834900","https://openalex.org/W4206351770","https://openalex.org/W4225390809","https://openalex.org/W4239477580","https://openalex.org/W4287617987","https://openalex.org/W4362650413","https://openalex.org/W6692846177","https://openalex.org/W6756001544","https://openalex.org/W6767818127","https://openalex.org/W6804409665","https://openalex.org/W6810657268"],"related_works":["https://openalex.org/W4239477580","https://openalex.org/W4255265352","https://openalex.org/W2921905705","https://openalex.org/W1632524629","https://openalex.org/W4292330635","https://openalex.org/W2902017027","https://openalex.org/W2766998270","https://openalex.org/W2950982235","https://openalex.org/W2052286527","https://openalex.org/W4306892756"],"abstract_inverted_index":{"The":[0],"Hamilton-Jacobi-Bellman":[1],"(HJB)":[2],"equation":[3,36],"serves":[4],"as":[5,53],"the":[6,12,16,25,29,32,43,48,66,69,74,82,85,92,101,118,132,140,143,159,162],"necessary":[7],"and":[8,73,78,127,155,181],"sufficient":[9],"condition":[10],"for":[11,147],"optimal":[13,19],"solution":[14],"to":[15,90],"continuous-time":[17],"(CT)":[18],"control":[20],"problem":[21,180],"(OCP).":[22],"Compared":[23],"with":[24,131],"infinite-horizon":[26],"HJB":[27,35],"equation,":[28],"solving":[30],"of":[31,47,84,125,134,161,171],"finite-horizon":[33],"(FH)":[34],"has":[37],"been":[38],"a":[39,169,175,182],"long-standing":[40],"challenge,":[41],"because":[42],"partial":[44,70],"time":[45,71],"derivative":[46,72],"value":[49],"function":[50],"is":[51,108,115,145,165],"involved":[52],"an":[54,111],"additional":[55],"unknown":[56],"term.":[57],"To":[58],"address":[59],"this":[60,62,98],"problem,":[61],"study":[63],"first-time":[64],"bridges":[65],"link":[67],"between":[68],"terminal-time":[75],"utility":[76],"function,":[77],"thus":[79],"it":[80],"facilitates":[81],"use":[83,133],"policy":[86],"iteration":[87],"(PI)":[88],"technique":[89],"solve":[91],"CT":[93,148],"FH":[94,102,149],"OCPs.":[95],"Based":[96],"on":[97,173],"key":[99],"finding,":[100],"approximate":[103],"dynamic":[104],"programming":[105],"(ADP)":[106],"algorithm":[107,119,144,164],"proposed":[109,163],"leveraging":[110],"actor-critic":[112,141],"framework.":[113],"It":[114],"shown":[116],"that":[117],"exhibits":[120],"important":[121],"properties":[122],"in":[123,139],"terms":[124],"convergence":[126],"optimality.":[128],"Rather":[129],"importantly,":[130],"multilayer":[135],"neural":[136],"networks":[137],"(NNs)":[138],"architecture,":[142],"suitable":[146],"OCPs":[150],"toward":[151],"more":[152],"general":[153],"nonlinear":[154,183],"complex":[156],"systems.":[157],"Finally,":[158],"effectiveness":[160],"demonstrated":[166],"by":[167],"conducting":[168],"series":[170],"simulations":[172],"both":[174],"linear":[176],"quadratic":[177],"regulator":[178],"(LQR)":[179],"vehicle":[184],"tracking":[185],"problem.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2026-05-02T08:42:23.175194","created_date":"2025-10-10T00:00:00"}
