{"id":"https://openalex.org/W3028234952","doi":"https://doi.org/10.1109/cis-ram47153.2019.9095802","title":"Trajectory-Tracking Control of Robotic Systems via Deep Reinforcement Learning","display_name":"Trajectory-Tracking Control of Robotic Systems via Deep Reinforcement Learning","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W3028234952","doi":"https://doi.org/10.1109/cis-ram47153.2019.9095802","mag":"3028234952"},"language":"en","primary_location":{"id":"doi:10.1109/cis-ram47153.2019.9095802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cis-ram47153.2019.9095802","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Cybernetics and Intelligent Systems (CIS) and IEEE Conference on Robotics, Automation and Mechatronics (RAM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070751669","display_name":"Shansi Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Shansi Zhang","raw_affiliation_strings":["School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057396057","display_name":"Chao Sun","orcid":"https://orcid.org/0000-0002-9902-1623"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Chao Sun","raw_affiliation_strings":["School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048169356","display_name":"Zhi Feng","orcid":"https://orcid.org/0000-0002-1301-7739"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhi Feng","raw_affiliation_strings":["School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050664552","display_name":"Guoqiang Hu","orcid":"https://orcid.org/0000-0002-8618-5581"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Guoqiang Hu","raw_affiliation_strings":["School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical & Electronic Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5070751669"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":0.7001,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.79163966,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"386","last_page":"391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8281158804893494},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.7314905524253845},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.644644021987915},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.616638720035553},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6165920495986938},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3479098081588745},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.05349546670913696},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.04993999004364014}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8281158804893494},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.7314905524253845},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.644644021987915},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.616638720035553},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6165920495986938},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3479098081588745},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.05349546670913696},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.04993999004364014},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cis-ram47153.2019.9095802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cis-ram47153.2019.9095802","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Cybernetics and Intelligent Systems (CIS) and IEEE Conference on Robotics, Automation and Mechatronics (RAM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1658008008","https://openalex.org/W1757796397","https://openalex.org/W2145339207","https://openalex.org/W2155968351","https://openalex.org/W2165150801","https://openalex.org/W2173564293","https://openalex.org/W2201581102","https://openalex.org/W2298546714","https://openalex.org/W2746553466","https://openalex.org/W2761873684","https://openalex.org/W2786928559","https://openalex.org/W2885163910","https://openalex.org/W2951799221","https://openalex.org/W2963428623","https://openalex.org/W2963477884","https://openalex.org/W2963864421","https://openalex.org/W2964043796","https://openalex.org/W2964291307","https://openalex.org/W2990747716","https://openalex.org/W3104515094","https://openalex.org/W4298857966","https://openalex.org/W4302570325","https://openalex.org/W6636881020","https://openalex.org/W6637967152","https://openalex.org/W6684205842","https://openalex.org/W6684921986","https://openalex.org/W6685444567","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6748554570","https://openalex.org/W6891797237"],"related_works":["https://openalex.org/W2542256560","https://openalex.org/W1543936162","https://openalex.org/W1971776229","https://openalex.org/W1578117154","https://openalex.org/W1971151","https://openalex.org/W2914830601","https://openalex.org/W2766961550","https://openalex.org/W2112263445","https://openalex.org/W1497101000","https://openalex.org/W2054235656"],"abstract_inverted_index":{"This":[0],"paper":[1],"studies":[2],"the":[3,69,76,85,95,101,105,115,120,128,132,136],"trajectory":[4,107],"tracking":[5,146],"problems":[6],"for":[7,37,68],"a":[8,12],"robotic":[9],"manipulator":[10],"and":[11,65,72,81,117,143],"mobile":[13],"robot":[14],"by":[15,135],"using":[16],"deep":[17,24],"reinforcement":[18,25],"learning":[19,26],"based":[20,28],"methods.":[21,122],"A":[22,53],"medel-free":[23],"method":[27],"on":[29],"Deep":[30],"Deter-ministic":[31],"Policy":[32],"Gradient":[33],"(DDPG)":[34],"is":[35,43,59],"designed":[36],"training.":[38],"The":[39],"priority":[40],"replay":[41],"memory":[42],"adopted":[44],"to":[45,93,113],"sample":[46],"more":[47],"significant":[48],"transitions":[49,64],"at":[50],"each":[51],"update.":[52],"distributed":[54,138],"framework":[55],"with":[56,78],"multiple":[57],"workers":[58,62,74],"proposed.":[60],"Synchronous":[61],"generate":[63],"compute":[66],"gradients":[67],"global":[70],"network,":[71],"collecting":[73],"explore":[75],"environment":[77],"different":[79],"policies":[80],"exploration":[82,96],"noises.":[83],"During":[84],"training,":[86],"we":[87],"adopt":[88],"random":[89],"reference":[90,106],"state":[91],"initialization":[92],"solve":[94],"problem,":[97],"which":[98],"can":[99,124],"make":[100],"robots":[102],"learn":[103,141],"from":[104,127],"effectively.":[108],"Numerical":[109],"simulations":[110],"are":[111],"provided":[112],"demonstrate":[114],"effectiveness":[116],"efficiency":[118],"of":[119],"proposed":[121,137],"It":[123],"be":[125],"seen":[126],"simulation":[129],"results":[130],"that":[131],"agent":[133],"trained":[134],"DDPG":[139],"could":[140],"faster":[142],"achieve":[144],"smaller":[145],"errors":[147],"than":[148],"DDPG.":[149]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
