{"id":"https://openalex.org/W3003393022","doi":"https://doi.org/10.1109/iros40897.2019.8968574","title":"Robotic Tracking Control with Kernel Trick-based Reinforcement Learning","display_name":"Robotic Tracking Control with Kernel Trick-based Reinforcement Learning","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W3003393022","doi":"https://doi.org/10.1109/iros40897.2019.8968574","mag":"3003393022"},"language":"en","primary_location":{"id":"doi:10.1109/iros40897.2019.8968574","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968574","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103000208","display_name":"Yazhou Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4391768281","display_name":"State Key Laboratory of Robotics","ror":"https://ror.org/03pcw1780","country_code":null,"type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"]},{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yazhou Hu","raw_affiliation_strings":["Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences,State Key Laboratory of Robotics,Shenyang,China,110016","State Key Laboratory of Robotics, Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences,State Key Laboratory of Robotics,Shenyang,China,110016","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115695520","display_name":"Wenxue Wang","orcid":"https://orcid.org/0000-0002-9137-8302"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4391768281","display_name":"State Key Laboratory of Robotics","ror":"https://ror.org/03pcw1780","country_code":null,"type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenxue Wang","raw_affiliation_strings":["Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences,State Key Laboratory of Robotics,Shenyang,China,110016","State Key Laboratory of Robotics, Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences,State Key Laboratory of Robotics,Shenyang,China,110016","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100458836","display_name":"Hao Liu","orcid":"https://orcid.org/0000-0002-7504-9859"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hao Liu","raw_affiliation_strings":["Georgia Institute of Technology,department of mathematics,Atlanta,GA,USA,30332","department of mathematics, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology,department of mathematics,Atlanta,GA,USA,30332","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"department of mathematics, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040326170","display_name":"Lianqing Liu","orcid":"https://orcid.org/0000-0002-2271-5870"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4391768281","display_name":"State Key Laboratory of Robotics","ror":"https://ror.org/03pcw1780","country_code":null,"type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianqing Liu","raw_affiliation_strings":["Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences,State Key Laboratory of Robotics,Shenyang,China,110016","State Key Laboratory of Robotics, Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences,State Key Laboratory of Robotics,Shenyang,China,110016","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Institutes for Robotics and Intelligent Manufacturing, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103000208"],"corresponding_institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366","https://openalex.org/I4391768281"],"apc_list":null,"apc_paid":null,"fwci":0.1998,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.58956464,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"2019","issue":null,"first_page":"997","last_page":"1002"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9340000152587891,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9208769798278809},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7628591060638428},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6232248544692993},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6182423830032349},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.529569149017334},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.48877498507499695},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.43855857849121094},{"id":"https://openalex.org/keywords/control-system","display_name":"Control system","score":0.4190016984939575},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.41075536608695984},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3610690236091614},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3227235674858093},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15529564023017883},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06365877389907837}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9208769798278809},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7628591060638428},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6232248544692993},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6182423830032349},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.529569149017334},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.48877498507499695},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.43855857849121094},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.4190016984939575},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.41075536608695984},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3610690236091614},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3227235674858093},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15529564023017883},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06365877389907837},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros40897.2019.8968574","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968574","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"mag:3087231992","is_oa":false,"landing_page_url":"https://jglobal.jst.go.jp/en/detail?JGLOBAL_ID=202002227569376682","pdf_url":null,"source":{"id":"https://openalex.org/S4306512817","display_name":"IEEE Conference Proceedings","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Conference Proceedings","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W15601695","https://openalex.org/W639062186","https://openalex.org/W1493190793","https://openalex.org/W1550698229","https://openalex.org/W1983345526","https://openalex.org/W2008437088","https://openalex.org/W2079553629","https://openalex.org/W2086702027","https://openalex.org/W2092959905","https://openalex.org/W2101915445","https://openalex.org/W2103676119","https://openalex.org/W2121863487","https://openalex.org/W2128920470","https://openalex.org/W2140135625","https://openalex.org/W2168342951","https://openalex.org/W2181371911","https://openalex.org/W2294330364","https://openalex.org/W2336652059","https://openalex.org/W2346806992","https://openalex.org/W2407115150","https://openalex.org/W2484646121","https://openalex.org/W2580909119","https://openalex.org/W2586680856","https://openalex.org/W2620010368","https://openalex.org/W2762398554","https://openalex.org/W2765094417","https://openalex.org/W2771998355","https://openalex.org/W2787963636","https://openalex.org/W2797655438","https://openalex.org/W2798534591","https://openalex.org/W2804158892","https://openalex.org/W2808399740","https://openalex.org/W4239052068","https://openalex.org/W4245296547","https://openalex.org/W4285719527","https://openalex.org/W6600624752","https://openalex.org/W6679401659","https://openalex.org/W6680657880"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W972276598","https://openalex.org/W4246352526","https://openalex.org/W2121910908","https://openalex.org/W915438175"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"reinforcement":[3,27,86],"learning":[4,28,55,79,87],"has":[5,140],"been":[6],"developed":[7],"dramatically":[8],"and":[9,106,144,154],"is":[10,71,90,124,162],"widely":[11],"used":[12],"to":[13,29,42,58,75,92,111],"solve":[14],"control":[15,32,56,63,95,119,148],"problems,":[16],"e.g.,":[17],"playing":[18],"games.":[19],"However,":[20],"there":[21],"are":[22],"still":[23],"some":[24],"problems":[25],"for":[26],"perform":[30,93],"robotic":[31,61,99],"tasks.":[33,64],"Fortunately,":[34],"the":[35,78,104,108,113,117,128,131,133,151,155],"kernel":[36,53,84],"trick-based":[37,54,85],"methods":[38],"provide":[39],"a":[40,52,83,98,121],"chance":[41],"deal":[43],"with":[44,130],"those":[45],"challenges.":[46],"This":[47],"work":[48,161],"aims":[49],"at":[50],"developing":[51],"method":[57],"carry":[59],"out":[60],"tracking":[62,88,94,147],"A":[65],"reward":[66,109,152],"system,":[67],"in":[68,73,159],"this":[69,160],"work,":[70],"presented":[72,91],"order":[74],"speed":[76,114],"up":[77],"processes.":[80],"And":[81],"then,":[82],"controller":[89],"tasks":[96,149],"on":[97],"manipulator":[100],"system.":[101],"To":[102],"evaluate":[103],"policy":[105],"assist":[107],"system":[110,123,157],"accelerate":[112],"of":[115],"finding":[116],"optimal":[118],"policy,":[120],"critic":[122,156],"introduced.":[125],"Finally,":[126],"from":[127],"comparison":[129],"benchmark,":[132],"simulation":[134],"results":[135],"illustrate":[136],"that":[137],"our":[138],"algorithm":[139],"faster":[141],"convergence":[142],"rate":[143],"can":[145],"execute":[146],"effectively,":[150],"function":[153],"proposed":[158],"efficient.":[163]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
