{"id":"https://openalex.org/W2408978589","doi":"https://doi.org/10.1109/tnnls.2015.2442233","title":"Parallel Online Temporal Difference Learning for Motor Control","display_name":"Parallel Online Temporal Difference Learning for Motor Control","publication_year":2015,"publication_date":"2015-06-23","ids":{"openalex":"https://openalex.org/W2408978589","doi":"https://doi.org/10.1109/tnnls.2015.2442233","mag":"2408978589","pmid":"https://pubmed.ncbi.nlm.nih.gov/26111402"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2015.2442233","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2015.2442233","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009958441","display_name":"Wouter Caarls","orcid":"https://orcid.org/0000-0001-9069-2378"},"institutions":[{"id":"https://openalex.org/I122140584","display_name":"Universidade Federal do Rio de Janeiro","ror":"https://ror.org/03490as77","country_code":"BR","type":"education","lineage":["https://openalex.org/I122140584"]},{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["BR","NL"],"is_corresponding":true,"raw_author_name":"Wouter Caarls","raw_affiliation_strings":["Departamento de Ci\u00eancia da Computa\u00e7\u00e3o/N\u00facleo de Computa\u00e7\u00e3o Eletr\u00f4nica, Federal University of Rio de Janeiro, Rio de Janeiro, Brazil","Department of Biomechanical Engineering, Delft University of Technology, Delft, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Departamento de Ci\u00eancia da Computa\u00e7\u00e3o/N\u00facleo de Computa\u00e7\u00e3o Eletr\u00f4nica, Federal University of Rio de Janeiro, Rio de Janeiro, Brazil","institution_ids":["https://openalex.org/I122140584"]},{"raw_affiliation_string":"Department of Biomechanical Engineering, Delft University of Technology, Delft, The Netherlands","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031675619","display_name":"E. Schuitema","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Erik Schuitema","raw_affiliation_strings":["Erik Schuitema Software Development, Delft, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Erik Schuitema Software Development, Delft, The Netherlands","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5009958441"],"corresponding_institution_ids":["https://openalex.org/I122140584","https://openalex.org/I98358874"],"apc_list":null,"apc_paid":null,"fwci":2.5886,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.91988745,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"27","issue":"7","first_page":"1457","last_page":"1468"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8904118537902832},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7365329265594482},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7092716693878174},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.6884549260139465},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6086015701293945},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5508140325546265},{"id":"https://openalex.org/keywords/temporal-difference-learning","display_name":"Temporal difference learning","score":0.5296958088874817},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4986753463745117},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.43058642745018005},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.41923388838768005},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3967358469963074},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1517539620399475},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.1049836277961731},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09039199352264404}],"concepts":[{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8904118537902832},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7365329265594482},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7092716693878174},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.6884549260139465},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6086015701293945},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5508140325546265},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.5296958088874817},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4986753463745117},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.43058642745018005},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.41923388838768005},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3967358469963074},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1517539620399475},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.1049836277961731},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09039199352264404},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2015.2442233","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2015.2442233","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:26111402","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/26111402","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.4300000071525574}],"awards":[{"id":"https://openalex.org/G2998096948","display_name":null,"funder_award_id":"611909","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W166862392","https://openalex.org/W1491843047","https://openalex.org/W1550698229","https://openalex.org/W1597173708","https://openalex.org/W1626155273","https://openalex.org/W1689445748","https://openalex.org/W1758031947","https://openalex.org/W1966086707","https://openalex.org/W1970391951","https://openalex.org/W1980035368","https://openalex.org/W1982262386","https://openalex.org/W1984120922","https://openalex.org/W1984381895","https://openalex.org/W1993740947","https://openalex.org/W1994923984","https://openalex.org/W2038509324","https://openalex.org/W2043724035","https://openalex.org/W2046376809","https://openalex.org/W2048226872","https://openalex.org/W2085627234","https://openalex.org/W2091565802","https://openalex.org/W2097797606","https://openalex.org/W2100752967","https://openalex.org/W2103285838","https://openalex.org/W2117629901","https://openalex.org/W2120346334","https://openalex.org/W2121863487","https://openalex.org/W2124403132","https://openalex.org/W2124674171","https://openalex.org/W2127412976","https://openalex.org/W2129564505","https://openalex.org/W2130105540","https://openalex.org/W2132622533","https://openalex.org/W2135376858","https://openalex.org/W2140135625","https://openalex.org/W2151250975","https://openalex.org/W2151661095","https://openalex.org/W2152083440","https://openalex.org/W2153039919","https://openalex.org/W2154208977","https://openalex.org/W2160829351","https://openalex.org/W2167647761","https://openalex.org/W2168945912","https://openalex.org/W2272929109","https://openalex.org/W2427881153","https://openalex.org/W2965916140","https://openalex.org/W4211089519","https://openalex.org/W4214717370","https://openalex.org/W4245108548","https://openalex.org/W4245296547","https://openalex.org/W6638058698","https://openalex.org/W6677737365","https://openalex.org/W6679365036","https://openalex.org/W6680657880","https://openalex.org/W6682467750","https://openalex.org/W6996421775"],"related_works":["https://openalex.org/W4400868993","https://openalex.org/W2145363145","https://openalex.org/W2341346307","https://openalex.org/W2154399718","https://openalex.org/W2768629321","https://openalex.org/W4384574988","https://openalex.org/W2130711276","https://openalex.org/W4321463377","https://openalex.org/W4308828368","https://openalex.org/W1528400370"],"abstract_inverted_index":{"Temporal":[0],"difference":[1],"(TD)":[2],"learning,":[3,9],"a":[4,11,97,114,120,127,135,143],"key":[5],"concept":[6],"in":[7,20,28,69],"reinforcement":[8],"is":[10,25],"popular":[12],"method":[13,24],"for":[14],"solving":[15],"simulated":[16,110],"control":[17,108,111],"problems.":[18],"However,":[19],"real":[21,70],"systems,":[22],"this":[23,59],"often":[26],"avoided":[27],"favor":[29],"of":[30,35,52,99,103,129,139],"policy":[31,41,54,151],"search":[32,42],"methods":[33],"because":[34],"its":[36,45],"long":[37],"learning":[38,65,78,137],"time.":[39],"But":[40],"suffers":[43],"from":[44],"own":[46],"drawbacks,":[47],"such":[48],"as":[49,73],"the":[50],"necessity":[51],"informed":[53],"parameterization":[55],"and":[56,79,86,119],"initialization.":[57],"In":[58],"paper,":[60],"we":[61,94,125],"show":[62],"that":[63],"TD":[64,107],"can":[66,95],"work":[67],"effectively":[68],"robotic":[71],"systems":[72],"well,":[74],"using":[75],"parallel":[76],"model":[77],"planning.":[80],"Using":[81],"locally":[82],"weighted":[83],"linear":[84],"regression":[85],"trajectory":[87],"sampled":[88],"planning":[89],"with":[90,134,149],"14":[91],"concurrent":[92],"threads,":[93],"achieve":[96],"speedup":[98,128],"almost":[100],"two":[101],"orders":[102],"magnitude":[104],"over":[105],"regular":[106],"on":[109],"benchmarks.":[112],"For":[113],"real-world":[115],"pendulum":[116],"swing-up":[117],"task":[118],"two-link":[121],"manipulator":[122],"movement":[123],"task,":[124],"report":[126],"20\u00d7":[130],"to":[131],"60\u00d7":[132],",":[133],"real-time":[136],"speed":[138],"less":[140],"than":[141],"half":[142],"minute.":[144],"The":[145],"results":[146],"are":[147],"competitive":[148],"state-of-the-art":[150],"search.":[152]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
