{"id":"https://openalex.org/W4366774499","doi":"https://doi.org/10.3390/robotics12020061","title":"An Incremental Inverse Reinforcement Learning Approach for Motion Planning with Separated Path and Velocity Preferences","display_name":"An Incremental Inverse Reinforcement Learning Approach for Motion Planning with Separated Path and Velocity Preferences","publication_year":2023,"publication_date":"2023-04-20","ids":{"openalex":"https://openalex.org/W4366774499","doi":"https://doi.org/10.3390/robotics12020061"},"language":"en","primary_location":{"id":"doi:10.3390/robotics12020061","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics12020061","pdf_url":"https://www.mdpi.com/2218-6581/12/2/61/pdf?version=1682059317","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2218-6581/12/2/61/pdf?version=1682059317","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061416006","display_name":"Armin Avaei","orcid":null},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Armin Avaei","raw_affiliation_strings":["Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080345874","display_name":"Linda van der Spaa","orcid":"https://orcid.org/0000-0002-6062-3141"},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]},{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["DE","NL"],"is_corresponding":true,"raw_author_name":"Linda van der Spaa","raw_affiliation_strings":["Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands","Honda Research Institute Europe, 63073 Offenbach am Main, Germany"],"raw_orcid":"https://orcid.org/0000-0002-6062-3141","affiliations":[{"raw_affiliation_string":"Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands","institution_ids":["https://openalex.org/I98358874"]},{"raw_affiliation_string":"Honda Research Institute Europe, 63073 Offenbach am Main, Germany","institution_ids":["https://openalex.org/I4210112253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042113474","display_name":"Luka Peternel","orcid":"https://orcid.org/0000-0002-8696-3689"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Luka Peternel","raw_affiliation_strings":["Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0002-8696-3689","affiliations":[{"raw_affiliation_string":"Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035229829","display_name":"Jens Kober","orcid":"https://orcid.org/0000-0001-7257-5434"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Jens Kober","raw_affiliation_strings":["Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0001-7257-5434","affiliations":[{"raw_affiliation_string":"Cognitive Robotics, Delft University of Technology, 2628 CD Delft, The Netherlands","institution_ids":["https://openalex.org/I98358874"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5080345874"],"corresponding_institution_ids":["https://openalex.org/I4210112253","https://openalex.org/I98358874"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":1.9727,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.8589069,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"12","issue":"2","first_page":"61","last_page":"61"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6917173862457275},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6639024019241333},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6588178277015686},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.6557964086532593},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.6193386316299438},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.605198085308075},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6015926599502563},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5650622844696045},{"id":"https://openalex.org/keywords/parameterized-complexity","display_name":"Parameterized complexity","score":0.5330141186714172},{"id":"https://openalex.org/keywords/kinesthetic-learning","display_name":"Kinesthetic learning","score":0.5312772989273071},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.525642991065979},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5206350684165955},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5198181867599487},{"id":"https://openalex.org/keywords/programming-by-demonstration","display_name":"Programming by demonstration","score":0.46793362498283386},{"id":"https://openalex.org/keywords/robotic-arm","display_name":"Robotic arm","score":0.4586174488067627},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.438810795545578},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3548661470413208},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3365152180194855},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.17999348044395447},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.12590858340263367},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11789754033088684}],"concepts":[{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6917173862457275},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6639024019241333},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6588178277015686},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6557964086532593},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.6193386316299438},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.605198085308075},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6015926599502563},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5650622844696045},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.5330141186714172},{"id":"https://openalex.org/C55457006","wikidata":"https://www.wikidata.org/wiki/Q3647098","display_name":"Kinesthetic learning","level":2,"score":0.5312772989273071},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.525642991065979},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5206350684165955},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5198181867599487},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.46793362498283386},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.4586174488067627},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.438810795545578},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3548661470413208},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3365152180194855},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.17999348044395447},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12590858340263367},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11789754033088684},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/robotics12020061","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics12020061","pdf_url":"https://www.mdpi.com/2218-6581/12/2/61/pdf?version=1682059317","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:28218f8067f64d0daae35f6cb0d94463","is_oa":true,"landing_page_url":"https://doaj.org/article/28218f8067f64d0daae35f6cb0d94463","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics, Vol 12, Iss 2, p 61 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2218-6581/12/2/61/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/robotics12020061","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics; Volume 12; Issue 2; Pages: 61","raw_type":"Text"},{"id":"pmh:oai:tudelft.nl:uuid:cfcf8ebd-8db4-4b5e-a174-6c0c16b21dfd","is_oa":false,"landing_page_url":"http://resolver.tudelft.nl/uuid:cfcf8ebd-8db4-4b5e-a174-6c0c16b21dfd","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"journal article"}],"best_oa_location":{"id":"doi:10.3390/robotics12020061","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics12020061","pdf_url":"https://www.mdpi.com/2218-6581/12/2/61/pdf?version=1682059317","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G1877445164","display_name":null,"funder_award_id":"804907","funder_id":"https://openalex.org/F4320334678","funder_display_name":"European Research Council"}],"funders":[{"id":"https://openalex.org/F4320318240","display_name":"European Space Agency","ror":"https://ror.org/03wd9za21"},{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4366774499.pdf"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W187005120","https://openalex.org/W1837766154","https://openalex.org/W1894373409","https://openalex.org/W1979117064","https://openalex.org/W2012204020","https://openalex.org/W2057134775","https://openalex.org/W2098774185","https://openalex.org/W2101392974","https://openalex.org/W2110304639","https://openalex.org/W2115166552","https://openalex.org/W2151498646","https://openalex.org/W2157289187","https://openalex.org/W2161819990","https://openalex.org/W2169498096","https://openalex.org/W2227909145","https://openalex.org/W2570503960","https://openalex.org/W2767508918","https://openalex.org/W2769520592","https://openalex.org/W2910123761","https://openalex.org/W2915070458","https://openalex.org/W2964177756","https://openalex.org/W3006303816","https://openalex.org/W3006334608","https://openalex.org/W3039563104","https://openalex.org/W3092948749","https://openalex.org/W3197594072","https://openalex.org/W3208223622","https://openalex.org/W4225737910","https://openalex.org/W6748210908","https://openalex.org/W6774122581"],"related_works":["https://openalex.org/W3111440524","https://openalex.org/W2051058708","https://openalex.org/W2558272010","https://openalex.org/W2068552404","https://openalex.org/W4392899229","https://openalex.org/W2921166921","https://openalex.org/W4385174651","https://openalex.org/W4320154428","https://openalex.org/W2773365182","https://openalex.org/W230475630"],"abstract_inverted_index":{"Humans":[0],"often":[1],"demonstrate":[2,116],"diverse":[3],"behaviors":[4],"due":[5],"to":[6,13,74,79,126,161],"their":[7,14,165],"personal":[8,19],"preferences,":[9],"for":[10,21,40],"instance,":[11],"related":[12],"individual":[15],"execution":[16],"style":[17],"or":[18],"margin":[20],"safety.":[22],"In":[23],"this":[24],"paper,":[25],"we":[26],"consider":[27],"the":[28,50,62,68,72,95,108,113,142,163],"problem":[29],"of":[30,90,102,112,122,146,172],"integrating":[31],"both":[32,80,106],"path":[33,52,69],"and":[34,53,70,83,110,140,144],"velocity":[35,54],"preferences":[36,55,97,125,166],"into":[37],"trajectory":[38,63],"planning":[39],"robotic":[41],"manipulators.":[42],"We":[43,59,86,115,129],"first":[44,67],"learn":[45],"reward":[46],"functions":[47],"that":[48,77,93,117,156],"represent":[49],"user":[51,84,151],"from":[56],"kinesthetic":[57],"demonstration.":[58],"then":[60,71],"optimize":[61],"in":[64,98,107,149],"two":[65],"steps,":[66],"velocity,":[73],"produce":[75],"trajectories":[76],"adhere":[78],"task":[81],"requirements":[82],"preferences.":[85],"design":[87],"a":[88,99,134,150,169],"set":[89],"parameterized":[91],"features":[92],"capture":[94],"fundamental":[96],"pick-and-place":[100],"type":[101],"object":[103],"transportation":[104],"task,":[105],"shape":[109],"timing":[111],"motion.":[114],"our":[118,131,147],"method":[119],"is":[120],"capable":[121],"generalizing":[123],"such":[124],"new":[127],"scenarios.":[128],"implement":[130],"algorithm":[132],"on":[133],"Franka":[135],"Emika":[136],"7-DoF":[137],"robot":[138,164],"arm":[139],"validate":[141],"functionality":[143],"flexibility":[145],"approach":[148],"study.":[152],"The":[153],"results":[154],"show":[155],"non-expert":[157],"users":[158],"are":[159],"able":[160],"teach":[162],"with":[167],"just":[168],"few":[170],"iterations":[171],"feedback.":[173]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
