{"id":"https://openalex.org/W4306963870","doi":"https://doi.org/10.3390/robotics11050116","title":"Trajectory Control of An Articulated Robot Based on Direct Reinforcement Learning","display_name":"Trajectory Control of An Articulated Robot Based on Direct Reinforcement Learning","publication_year":2022,"publication_date":"2022-10-20","ids":{"openalex":"https://openalex.org/W4306963870","doi":"https://doi.org/10.3390/robotics11050116"},"language":"en","primary_location":{"id":"doi:10.3390/robotics11050116","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics11050116","pdf_url":"https://www.mdpi.com/2218-6581/11/5/116/pdf?version=1666677072","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2218-6581/11/5/116/pdf?version=1666677072","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101239623","display_name":"Chia\u2010Hao Tsai","orcid":null},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chia-Hao Tsai","raw_affiliation_strings":["Department of Mechanical Engineering, National Taiwan University, No. 1, Sec. 4, Roosevelt Rd., Taipei 106216, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, National Taiwan University, No. 1, Sec. 4, Roosevelt Rd., Taipei 106216, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103188257","display_name":"Jun-Ji Lin","orcid":"https://orcid.org/0000-0002-5151-113X"},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jun-Ji Lin","raw_affiliation_strings":["Department of Mechanical Engineering, National Taiwan University, No. 1, Sec. 4, Roosevelt Rd., Taipei 106216, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, National Taiwan University, No. 1, Sec. 4, Roosevelt Rd., Taipei 106216, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038864857","display_name":"Teng-Feng Hsieh","orcid":null},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Teng-Feng Hsieh","raw_affiliation_strings":["Department of Mechanical Engineering, National Taiwan University, No. 1, Sec. 4, Roosevelt Rd., Taipei 106216, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, National Taiwan University, No. 1, Sec. 4, Roosevelt Rd., Taipei 106216, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046013877","display_name":"Jia\u2010Yush Yen","orcid":"https://orcid.org/0000-0001-8795-9211"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Jia-Yush Yen","raw_affiliation_strings":["Department of Mechanical Engineering, National Taiwan University of Science and Technology, No. 43, Sec. 4, Taipei 106335, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, National Taiwan University of Science and Technology, No. 43, Sec. 4, Taipei 106335, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5046013877"],"corresponding_institution_ids":["https://openalex.org/I154864474"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":0.6894,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.75425804,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"11","issue":"5","first_page":"116","last_page":"116"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9876000285148621,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9876000285148621,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9772999882698059,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.9671000242233276,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6999186277389526},{"id":"https://openalex.org/keywords/inverse-dynamics","display_name":"Inverse dynamics","score":0.6985343098640442},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6809202432632446},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.6226556301116943},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5904056429862976},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5804187059402466},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.5642058849334717},{"id":"https://openalex.org/keywords/inverse-kinematics","display_name":"Inverse kinematics","score":0.562038242816925},{"id":"https://openalex.org/keywords/model-predictive-control","display_name":"Model predictive control","score":0.5444723963737488},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5427042245864868},{"id":"https://openalex.org/keywords/torque","display_name":"Torque","score":0.4889615774154663},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.45005133748054504},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.4414587616920471},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43874597549438477},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.37206530570983887},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.25119662284851074},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.13501214981079102}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6999186277389526},{"id":"https://openalex.org/C187523126","wikidata":"https://www.wikidata.org/wiki/Q17098330","display_name":"Inverse dynamics","level":3,"score":0.6985343098640442},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6809202432632446},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.6226556301116943},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5904056429862976},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5804187059402466},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.5642058849334717},{"id":"https://openalex.org/C17816587","wikidata":"https://www.wikidata.org/wiki/Q1501872","display_name":"Inverse kinematics","level":3,"score":0.562038242816925},{"id":"https://openalex.org/C172205157","wikidata":"https://www.wikidata.org/wiki/Q1782962","display_name":"Model predictive control","level":3,"score":0.5444723963737488},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5427042245864868},{"id":"https://openalex.org/C144171764","wikidata":"https://www.wikidata.org/wiki/Q48103","display_name":"Torque","level":2,"score":0.4889615774154663},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.45005133748054504},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.4414587616920471},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43874597549438477},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.37206530570983887},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.25119662284851074},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.13501214981079102},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/robotics11050116","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics11050116","pdf_url":"https://www.mdpi.com/2218-6581/11/5/116/pdf?version=1666677072","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:9f58a328791d42988b3f0b65acdc2e37","is_oa":true,"landing_page_url":"https://doaj.org/article/9f58a328791d42988b3f0b65acdc2e37","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics, Vol 11, Iss 5, p 116 (2022)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2218-6581/11/5/116/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/robotics11050116","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics; Volume 11; Issue 5; Pages: 116","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/robotics11050116","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics11050116","pdf_url":"https://www.mdpi.com/2218-6581/11/5/116/pdf?version=1666677072","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7099999785423279,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320331164","display_name":"National Science and Technology Council","ror":"https://ror.org/00wnb9798"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4306963870.pdf","grobid_xml":"https://content.openalex.org/works/W4306963870.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W139620917","https://openalex.org/W1973338532","https://openalex.org/W2025033535","https://openalex.org/W2073787051","https://openalex.org/W2079886367","https://openalex.org/W2087316754","https://openalex.org/W2093253120","https://openalex.org/W2106871887","https://openalex.org/W2109169869","https://openalex.org/W2124267516","https://openalex.org/W2127107099","https://openalex.org/W2173248099","https://openalex.org/W2511924737","https://openalex.org/W2553109721","https://openalex.org/W2575705757","https://openalex.org/W2593237273","https://openalex.org/W2596758708","https://openalex.org/W2621305136","https://openalex.org/W2743408048","https://openalex.org/W2746553466","https://openalex.org/W2791924686","https://openalex.org/W2808565671","https://openalex.org/W2885522997","https://openalex.org/W2896479405","https://openalex.org/W2903148528","https://openalex.org/W2909718913","https://openalex.org/W2909983946","https://openalex.org/W2947238547","https://openalex.org/W2951170679","https://openalex.org/W3044645263","https://openalex.org/W3083415411","https://openalex.org/W3093426589","https://openalex.org/W3119867786","https://openalex.org/W3138640436","https://openalex.org/W3156522175","https://openalex.org/W3205942598","https://openalex.org/W4237733001","https://openalex.org/W6684205842"],"related_works":["https://openalex.org/W1990079087","https://openalex.org/W2060165215","https://openalex.org/W2101188133","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3202234113","https://openalex.org/W4380318855","https://openalex.org/W4248731570","https://openalex.org/W2572731987","https://openalex.org/W2291700020"],"abstract_inverted_index":{"Reinforcement":[0],"Learning":[1],"(RL)":[2],"is":[3,43],"gaining":[4],"much":[5],"research":[6],"attention":[7],"because":[8],"it":[9,152,161],"allows":[10],"the":[11,18,26,36,47,64,79,98,118,125,129,144,157,168,171,176,180],"system":[12],"to":[13,62,90,96],"learn":[14,63],"from":[15],"interacting":[16],"with":[17,21,128],"environment.":[19],"Yet,":[20],"all":[22],"these":[23],"successful":[24,58,99],"applications,":[25],"application":[27],"of":[28,38,60,78,101],"RL":[29,61,126,172],"in":[30,46],"direct":[31,65],"joint":[32],"torque":[33,66],"control":[34,67,100,127,137],"without":[35,75,105],"help":[37],"an":[39,107],"underlining":[40],"dynamic":[41,80],"model":[42,110],"not":[44,154],"reported":[45],"literature.":[48],"This":[49],"study":[50],"presents":[51],"a":[52,71,86],"split":[53],"network":[54],"structure":[55],"that":[56,142],"enables":[57],"training":[59,84],"for":[68],"trajectory":[69,136],"following":[70],"six-axis":[72],"articulated":[73],"robot":[74,81],"prior":[76],"knowledge":[77],"model.":[82],"The":[83],"took":[85],"very":[87],"long":[88],"time":[89],"converge.":[91],"However,":[92],"we":[93,122],"were":[94],"able":[95],"show":[97,117,141],"four":[102],"different":[103],"trajectories":[104],"needing":[106],"accurate":[108,150],"dynamics":[109,165],"and":[111,148],"complex":[112,163],"inverse":[113,164],"kinematics":[114],"computation.":[115],"To":[116],"RL-based":[119],"control\u2019s":[120],"effectiveness,":[121],"also":[123],"compare":[124],"Model":[130],"Predictive":[131],"Control":[132],"(MPC),":[133],"another":[134],"popular":[135],"method.":[138],"Our":[139],"results":[140],"while":[143],"MPC":[145],"achieves":[146],"smoother":[147],"more":[149],"control,":[151],"does":[153],"automatically":[155],"treat":[156],"singularity.":[158],"In":[159],"addition,":[160],"requires":[162],"calculations.":[166],"On":[167],"other":[169],"hand,":[170],"controller":[173],"instinctively":[174],"avoided":[175],"violent":[177],"action":[178],"around":[179],"singularities.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2022-10-21T00:00:00"}
