{"id":"https://openalex.org/W4313562991","doi":"https://doi.org/10.1109/humanoids53995.2022.10000148","title":"Adapting Object-Centric Probabilistic Movement Primitives with Residual Reinforcement Learning","display_name":"Adapting Object-Centric Probabilistic Movement Primitives with Residual Reinforcement Learning","publication_year":2022,"publication_date":"2022-11-28","ids":{"openalex":"https://openalex.org/W4313562991","doi":"https://doi.org/10.1109/humanoids53995.2022.10000148"},"language":"en","primary_location":{"id":"doi:10.1109/humanoids53995.2022.10000148","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids53995.2022.10000148","pdf_url":null,"source":{"id":"https://openalex.org/S4363608580","display_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053233736","display_name":"J. Frederico Carvalho","orcid":"https://orcid.org/0000-0002-8750-0897"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I4210156583","display_name":"Laboratoire d'Informatique de Paris-Nord","ror":"https://ror.org/05g1zjw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210091279","https://openalex.org/I4210156583","https://openalex.org/I4210159245"]}],"countries":["DE","FR"],"is_corresponding":true,"raw_author_name":"Joao Carvalho","raw_affiliation_strings":["Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems"],"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]},{"raw_affiliation_string":"Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063353075","display_name":"Dorothea Koert","orcid":"https://orcid.org/0000-0002-3571-6848"},"institutions":[{"id":"https://openalex.org/I4210122262","display_name":"Institut des Sciences Cognitives Marc Jeannerod","ror":"https://ror.org/02he5dz58","country_code":"FR","type":"facility","lineage":["https://openalex.org/I100532134","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I203339264","https://openalex.org/I4210096427","https://openalex.org/I4210122262"]},{"id":"https://openalex.org/I4210156583","display_name":"Laboratoire d'Informatique de Paris-Nord","ror":"https://ror.org/05g1zjw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210091279","https://openalex.org/I4210156583","https://openalex.org/I4210159245"]},{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE","FR"],"is_corresponding":false,"raw_author_name":"Dorothea Koert","raw_affiliation_strings":["Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","TUDa Centre for Cognitive Science","Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems"],"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]},{"raw_affiliation_string":"TUDa Centre for Cognitive Science","institution_ids":["https://openalex.org/I4210122262"]},{"raw_affiliation_string":"Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008668331","display_name":"Marek Daniv","orcid":null},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I4210156583","display_name":"Laboratoire d'Informatique de Paris-Nord","ror":"https://ror.org/05g1zjw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210091279","https://openalex.org/I4210156583","https://openalex.org/I4210159245"]}],"countries":["DE","FR"],"is_corresponding":false,"raw_author_name":"Marek Daniv","raw_affiliation_strings":["Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems"],"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]},{"raw_affiliation_string":"Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071367253","display_name":"Jan Peters","orcid":"https://orcid.org/0000-0002-5266-8091"},"institutions":[{"id":"https://openalex.org/I33256026","display_name":"German Research Centre for Artificial Intelligence","ror":"https://ror.org/01ayc5b57","country_code":"DE","type":"funder","lineage":["https://openalex.org/I33256026"]},{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I4210122262","display_name":"Institut des Sciences Cognitives Marc Jeannerod","ror":"https://ror.org/02he5dz58","country_code":"FR","type":"facility","lineage":["https://openalex.org/I100532134","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I203339264","https://openalex.org/I4210096427","https://openalex.org/I4210122262"]},{"id":"https://openalex.org/I4210156583","display_name":"Laboratoire d'Informatique de Paris-Nord","ror":"https://ror.org/05g1zjw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210091279","https://openalex.org/I4210156583","https://openalex.org/I4210159245"]},{"id":"https://openalex.org/I16718484","display_name":"Hess (United States)","ror":"https://ror.org/00zbk1w77","country_code":"US","type":"company","lineage":["https://openalex.org/I16718484"]}],"countries":["DE","FR","US"],"is_corresponding":false,"raw_author_name":"Jan Peters","raw_affiliation_strings":["Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","TUDa Centre for Cognitive Science","Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems","Research Department: Systems AI for Robot Learning, German Research Center for AI (DFKI)","Hessian. AI"],"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Autonomous Systems,TU Darmstadt (TUDa),Computer Science Department","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]},{"raw_affiliation_string":"TUDa Centre for Cognitive Science","institution_ids":["https://openalex.org/I4210122262"]},{"raw_affiliation_string":"Computer Science Department, TU Darmstadt (TUDa), Institute for Intelligent Autonomous Systems","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I31512782"]},{"raw_affiliation_string":"Research Department: Systems AI for Robot Learning, German Research Center for AI (DFKI)","institution_ids":["https://openalex.org/I33256026"]},{"raw_affiliation_string":"Hessian. AI","institution_ids":["https://openalex.org/I16718484"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053233736"],"corresponding_institution_ids":["https://openalex.org/I31512782","https://openalex.org/I4210156583"],"apc_list":null,"apc_paid":null,"fwci":1.4109,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.8270216,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"405","last_page":"412"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9696000218391418,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7903835773468018},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7264487147331238},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6997501850128174},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6918687224388123},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6798825263977051},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6510556936264038},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5791944861412048},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.5364521145820618},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5327228307723999},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.45647767186164856},{"id":"https://openalex.org/keywords/cartesian-coordinate-system","display_name":"Cartesian coordinate system","score":0.45239678025245667},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.44529396295547485},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.4177165627479553},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.332388311624527},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1309441328048706}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7903835773468018},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7264487147331238},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6997501850128174},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6918687224388123},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6798825263977051},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6510556936264038},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5791944861412048},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.5364521145820618},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5327228307723999},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.45647767186164856},{"id":"https://openalex.org/C16038011","wikidata":"https://www.wikidata.org/wiki/Q62912","display_name":"Cartesian coordinate system","level":2,"score":0.45239678025245667},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.44529396295547485},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.4177165627479553},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.332388311624527},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1309441328048706},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/humanoids53995.2022.10000148","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids53995.2022.10000148","pdf_url":null,"source":{"id":"https://openalex.org/S4363608580","display_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.5099999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W2012392077","https://openalex.org/W2128677288","https://openalex.org/W2131666656","https://openalex.org/W2136719407","https://openalex.org/W2155027007","https://openalex.org/W2156321584","https://openalex.org/W2172968643","https://openalex.org/W2528951757","https://openalex.org/W2604272474","https://openalex.org/W2735021678","https://openalex.org/W2913668833","https://openalex.org/W2958441538","https://openalex.org/W2964319110","https://openalex.org/W2967727187","https://openalex.org/W2970377754","https://openalex.org/W2998544442","https://openalex.org/W3003629310","https://openalex.org/W3009632987","https://openalex.org/W3017212538","https://openalex.org/W3028308378","https://openalex.org/W3081200565","https://openalex.org/W3091552533","https://openalex.org/W3100172161","https://openalex.org/W3101875589","https://openalex.org/W3127352841","https://openalex.org/W3130717831","https://openalex.org/W3132045372","https://openalex.org/W3134091418","https://openalex.org/W3155877522","https://openalex.org/W3159735414","https://openalex.org/W3166834117","https://openalex.org/W3171801597","https://openalex.org/W3197400104","https://openalex.org/W3201276701","https://openalex.org/W3205745479","https://openalex.org/W3216933777","https://openalex.org/W4211008118","https://openalex.org/W4286891162","https://openalex.org/W4289115845","https://openalex.org/W4300568640","https://openalex.org/W4308538573","https://openalex.org/W6631190155","https://openalex.org/W6640963894","https://openalex.org/W6680971464","https://openalex.org/W6683001934","https://openalex.org/W6683204974","https://openalex.org/W6747473740","https://openalex.org/W6748839928","https://openalex.org/W6756848961","https://openalex.org/W6764969207","https://openalex.org/W6765008394","https://openalex.org/W6785022314","https://openalex.org/W6796992754","https://openalex.org/W6803241323","https://openalex.org/W6804806280","https://openalex.org/W6807335531"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2560215812","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W2949601986","https://openalex.org/W4323768008","https://openalex.org/W1941703695","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090"],"abstract_inverted_index":{"It":[0],"is":[1,60],"desirable":[2],"for":[3,96,138],"future":[4],"robots":[5],"to":[6,15,28,33,84,94,133,171],"quickly":[7],"learn":[8,34,109],"new":[9],"tasks":[10],"and":[11,75,101,122],"adapt":[12],"learned":[13,68],"skills":[14],"constantly":[16],"changing":[17],"environments.":[18],"To":[19],"this":[20],"end,":[21],"Probabilistic":[22],"Movement":[23],"Primitives":[24],"(ProMPs)":[25],"have":[26],"shown":[27],"be":[29],"a":[30,110,115,130,141,151,157],"promising":[31],"framework":[32],"generalizable":[35],"trajectory":[36,118],"generators":[37],"from":[38,72],"distributions":[39],"over":[40],"demonstrated":[41],"trajectories.":[42],"However,":[43],"in":[44,51,63,69,99,126],"practical":[45],"applications":[46],"that":[47,166],"require":[48],"high":[49],"precision":[50],"the":[52,56,88,124,127,135,167,173],"manipulation":[53],"of":[54,58,114,143],"objects,":[55],"accuracy":[57],"ProMPs":[59,86],"often":[61],"insufficient,":[62],"particular":[64],"when":[65],"they":[66],"are":[67],"cartesian":[70],"space":[71,137],"external":[73],"observations":[74],"executed":[76],"with":[77,87,119,156,180],"limited":[78],"controller":[79],"gains.":[80],"Therefore,":[81],"we":[82,108,145],"propose":[83],"combine":[85],"Residual":[89],"Reinforcement":[90],"Learning":[91],"(RRL)":[92],"framework,":[93],"account":[95],"both,":[97],"corrections":[98],"position":[100],"orientation":[102],"during":[103],"task":[104,155],"execution.":[105],"In":[106],"particular,":[107],"residual":[111],"on":[112,150],"top":[113],"nominal":[116],"ProMP":[117],"Soft":[120],"Actor-Critic":[121],"incorporate":[123],"variability":[125],"demonstrations":[128],"as":[129],"decision":[131],"variable":[132],"reduce":[134],"search":[136],"RRL.":[139],"As":[140],"proof":[142],"concept,":[144],"evaluate":[146],"our":[147],"proposed":[148],"method":[149],"3D":[152],"block":[153],"insertion":[154],"7-DoF":[158],"Franka":[159],"Emika":[160],"Panda":[161],"robot.":[162],"Experimental":[163],"results":[164],"show":[165],"robot":[168],"successfully":[169],"learns":[170],"complete":[172],"insertion,":[174],"which":[175],"was":[176],"not":[177],"possible":[178],"before":[179],"using":[181],"basic":[182],"ProMPs.":[183]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
