{"id":"https://openalex.org/W3203990188","doi":"https://doi.org/10.1109/tsmc.2021.3112688","title":"Optimized Backstepping Tracking Control Using Reinforcement Learning for Quadrotor Unmanned Aerial Vehicle System","display_name":"Optimized Backstepping Tracking Control Using Reinforcement Learning for Quadrotor Unmanned Aerial Vehicle System","publication_year":2021,"publication_date":"2021-09-23","ids":{"openalex":"https://openalex.org/W3203990188","doi":"https://doi.org/10.1109/tsmc.2021.3112688","mag":"3203990188"},"language":"en","primary_location":{"id":"doi:10.1109/tsmc.2021.3112688","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2021.3112688","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063205336","display_name":"Guoxing Wen","orcid":"https://orcid.org/0000-0002-6392-5989"},"institutions":[{"id":"https://openalex.org/I151013683","display_name":"Binzhou University","ror":"https://ror.org/05frpfj73","country_code":"CN","type":"education","lineage":["https://openalex.org/I151013683"]},{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guoxing Wen","raw_affiliation_strings":["College of Science, Binzhou University, Binzhou, China","School of Mathematics and Statistics, Qilu University of Technology, Jinan, China"],"affiliations":[{"raw_affiliation_string":"College of Science, Binzhou University, Binzhou, China","institution_ids":["https://openalex.org/I151013683"]},{"raw_affiliation_string":"School of Mathematics and Statistics, Qilu University of Technology, Jinan, China","institution_ids":["https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061544952","display_name":"Wei Hao","orcid":"https://orcid.org/0000-0003-0071-5084"},"institutions":[{"id":"https://openalex.org/I151013683","display_name":"Binzhou University","ror":"https://ror.org/05frpfj73","country_code":"CN","type":"education","lineage":["https://openalex.org/I151013683"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Hao","raw_affiliation_strings":["Flight College, Binzhou University, Binzhou, China"],"affiliations":[{"raw_affiliation_string":"Flight College, Binzhou University, Binzhou, China","institution_ids":["https://openalex.org/I151013683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102201818","display_name":"Weiwei Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I151013683","display_name":"Binzhou University","ror":"https://ror.org/05frpfj73","country_code":"CN","type":"education","lineage":["https://openalex.org/I151013683"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiwei Feng","raw_affiliation_strings":["College of Aeronautical Engineering and the Shandong Engineering Research Center of Aeronautical Materials and Devices, Binzhou University, Binzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Aeronautical Engineering and the Shandong Engineering Research Center of Aeronautical Materials and Devices, Binzhou University, Binzhou, China","institution_ids":["https://openalex.org/I151013683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082236615","display_name":"Kaizhou Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I111950717","display_name":"Macau University of Science and Technology","ror":"https://ror.org/03jqs2n27","country_code":"MO","type":"education","lineage":["https://openalex.org/I111950717","https://openalex.org/I4391767947"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Kaizhou Gao","raw_affiliation_strings":["Institute of Systems Engineering, Macau University of Science and Technology, Macau, China"],"affiliations":[{"raw_affiliation_string":"Institute of Systems Engineering, Macau University of Science and Technology, Macau, China","institution_ids":["https://openalex.org/I111950717"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5063205336"],"corresponding_institution_ids":["https://openalex.org/I151013683","https://openalex.org/I152269853"],"apc_list":null,"apc_paid":null,"fwci":9.3498,"has_fulltext":false,"cited_by_count":112,"citation_normalized_percentile":{"value":0.98331001,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"52","issue":"8","first_page":"5004","last_page":"5015"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9699000120162964,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/backstepping","display_name":"Backstepping","score":0.8931950330734253},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7360294461250305},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.658542275428772},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5547258257865906},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.47348225116729736},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.46082010865211487},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4433594048023224},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40714994072914124},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.32292476296424866},{"id":"https://openalex.org/keywords/adaptive-control","display_name":"Adaptive control","score":0.16065776348114014},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.06739136576652527}],"concepts":[{"id":"https://openalex.org/C72218879","wikidata":"https://www.wikidata.org/wiki/Q4839759","display_name":"Backstepping","level":4,"score":0.8931950330734253},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7360294461250305},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.658542275428772},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5547258257865906},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.47348225116729736},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.46082010865211487},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4433594048023224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40714994072914124},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.32292476296424866},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.16065776348114014},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.06739136576652527},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2021.3112688","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2021.3112688","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1036860860","display_name":null,"funder_award_id":"ZR2019PF021","funder_id":"https://openalex.org/F4320324174","funder_display_name":"Natural Science Foundation of Shandong Province"},{"id":"https://openalex.org/G2441221401","display_name":null,"funder_award_id":"61603169","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5969645192","display_name":null,"funder_award_id":"62103060","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5971077570","display_name":null,"funder_award_id":"ZR2018MF015","funder_id":"https://openalex.org/F4320324174","funder_display_name":"Natural Science Foundation of Shandong Province"},{"id":"https://openalex.org/G741060987","display_name":null,"funder_award_id":"62173356","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8866375341","display_name":null,"funder_award_id":"62073045","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320324174","display_name":"Natural Science Foundation of Shandong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1983523797","https://openalex.org/W1998484460","https://openalex.org/W2025004307","https://openalex.org/W2069882558","https://openalex.org/W2080640384","https://openalex.org/W2082856443","https://openalex.org/W2093597151","https://openalex.org/W2104843094","https://openalex.org/W2109920799","https://openalex.org/W2125525186","https://openalex.org/W2134069001","https://openalex.org/W2137570966","https://openalex.org/W2141209752","https://openalex.org/W2157351539","https://openalex.org/W2161908285","https://openalex.org/W2165314520","https://openalex.org/W2167229184","https://openalex.org/W2167287735","https://openalex.org/W2168191426","https://openalex.org/W2231576311","https://openalex.org/W2245289424","https://openalex.org/W2262108890","https://openalex.org/W2546583797","https://openalex.org/W2780814805","https://openalex.org/W2787890633","https://openalex.org/W2887519063","https://openalex.org/W2888959292","https://openalex.org/W2912259603","https://openalex.org/W2981246288","https://openalex.org/W2998437857","https://openalex.org/W3003040443","https://openalex.org/W3041284915","https://openalex.org/W3083270461","https://openalex.org/W3124444594","https://openalex.org/W3195761866"],"related_works":["https://openalex.org/W2771027241","https://openalex.org/W1765905465","https://openalex.org/W2793080664","https://openalex.org/W2186140227","https://openalex.org/W2534185822","https://openalex.org/W2132535444","https://openalex.org/W2170944339","https://openalex.org/W2477888563","https://openalex.org/W1972061147","https://openalex.org/W3167722269"],"abstract_inverted_index":{"In":[0,72],"this":[1],"article,":[2],"an":[3,162,170],"optimized":[4,103,124,188],"tracking":[5,104],"control":[6,61,70,157,164,190],"scheme":[7,105],"is":[8,44,57,66,77,106,131,158,169,178],"studied":[9],"for":[10,58,67],"the":[11,25,33,38,55,60,64,69,88,102,115,122,129,134,137,143,155,166,174,184,187,199],"quadrotor":[12],"unmanned":[13],"aerial":[14],"vehicle":[15],"(QUAV)":[16],"system":[17,76],"by":[18,87,147,160,203],"combining":[19],"both":[20,48],"reinforcement":[21],"learning":[22],"(RL)":[23],"and":[24,42,50,63,90,117,126,208],"backstepping":[26],"technique.":[27],"The":[28],"RL":[29,130,176],"aims":[30],"to":[31,114],"overcome":[32],"difficulty":[34],"coming":[35],"from":[36],"solving":[37],"Hamilton\u2013Jacobi\u2013Bellman":[39],"(HJB)":[40],"equation,":[41],"it":[43],"performed":[45],"via":[46,97],"iterating":[47],"critic":[49,56],"actor":[51,65],"each":[52],"other,":[53],"where":[54],"improving":[59],"performance":[62],"executing":[68],"behavior.":[71],"mathematics,":[73],"a":[74,98,204,209],"QUAV":[75,189],"composed":[78,107],"of":[79,108,136,142],"two":[80,109,123],"connected":[81],"subsystems":[82],"that":[83],"are,":[84],"respectively,":[85],"modeled":[86],"translational":[89,167],"rotational":[91],"dynamic":[92,168],"equations,":[93],"which":[94],"are":[95,201],"coupled":[96],"rotation":[99],"matrix;":[100],"hence,":[101],"interconnected":[110],"individual":[111],"controls":[112],"corresponding":[113],"position":[116,125,156],"attitude,":[118],"respectively.":[119],"To":[120],"achieve":[121],"attitude":[127],"controls,":[128],"constructed":[132],"on":[133],"basis":[135],"neural":[138],"network":[139],"(NN)":[140],"approximation":[141,152],"HJB":[144],"equation\u2019s":[145],"solution":[146],"utilizing":[148],"NN\u2019s":[149],"outstanding":[150],"function":[151],"ability.":[153],"Particularly,":[154],"accomplished":[159],"introducing":[161],"intermediate":[163],"because":[165],"underactuated":[171],"system.":[172],"Since":[173],"proposed":[175],"algorithm":[177],"significantly":[179],"simple":[180],"in":[181,195],"comparison":[182],"with":[183],"published":[185],"methods,":[186],"can":[191],"be":[192],"easily":[193],"executed":[194],"practical":[196],"applications.":[197],"Finally,":[198],"results":[200],"demonstrated":[202],"Lyapunov":[205],"stability":[206],"analysis":[207],"numerical":[210],"simulation.":[211]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":44},{"year":2024,"cited_by_count":36},{"year":2023,"cited_by_count":18},{"year":2022,"cited_by_count":8}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2025-10-10T00:00:00"}
