{"id":"https://openalex.org/W2016765487","doi":"https://doi.org/10.1109/iros.2010.5649089","title":"Robot motor skill coordination with EM-based Reinforcement Learning","display_name":"Robot motor skill coordination with EM-based Reinforcement Learning","publication_year":2010,"publication_date":"2010-10-01","ids":{"openalex":"https://openalex.org/W2016765487","doi":"https://doi.org/10.1109/iros.2010.5649089","mag":"2016765487"},"language":"en","primary_location":{"id":"doi:10.1109/iros.2010.5649089","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2010.5649089","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE/RSJ International Conference on Intelligent Robots and Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036281885","display_name":"Petar Kormushev","orcid":"https://orcid.org/0000-0002-6677-3044"},"institutions":[{"id":"https://openalex.org/I30771326","display_name":"Italian Institute of Technology","ror":"https://ror.org/042t93s57","country_code":"IT","type":"facility","lineage":["https://openalex.org/I30771326"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Petar Kormushev","raw_affiliation_strings":["Advanced Robotics Department, Italian Institute of Technology, Genoa, Italy","Advanced Robotics Department, Italian Institute of Technology (IIT), 16163 Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Advanced Robotics Department, Italian Institute of Technology, Genoa, Italy","institution_ids":["https://openalex.org/I30771326"]},{"raw_affiliation_string":"Advanced Robotics Department, Italian Institute of Technology (IIT), 16163 Genova, Italy","institution_ids":["https://openalex.org/I30771326"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048780399","display_name":"Sylvain Calinon","orcid":"https://orcid.org/0000-0002-9036-6799"},"institutions":[{"id":"https://openalex.org/I30771326","display_name":"Italian Institute of Technology","ror":"https://ror.org/042t93s57","country_code":"IT","type":"facility","lineage":["https://openalex.org/I30771326"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Sylvain Calinon","raw_affiliation_strings":["Advanced Robotics Department, Italian Institute of Technology, Genoa, Italy","Advanced Robotics Department, Italian Institute of Technology (IIT), 16163 Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Advanced Robotics Department, Italian Institute of Technology, Genoa, Italy","institution_ids":["https://openalex.org/I30771326"]},{"raw_affiliation_string":"Advanced Robotics Department, Italian Institute of Technology (IIT), 16163 Genova, Italy","institution_ids":["https://openalex.org/I30771326"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044243940","display_name":"Darwin G. Caldwell","orcid":"https://orcid.org/0000-0002-6233-9961"},"institutions":[{"id":"https://openalex.org/I30771326","display_name":"Italian Institute of Technology","ror":"https://ror.org/042t93s57","country_code":"IT","type":"facility","lineage":["https://openalex.org/I30771326"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Darwin G Caldwell","raw_affiliation_strings":["Advanced Robotics Department, Italian Institute of Technology, Genoa, Italy","Advanced Robotics Department, Italian Institute of Technology (IIT), 16163 Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Advanced Robotics Department, Italian Institute of Technology, Genoa, Italy","institution_ids":["https://openalex.org/I30771326"]},{"raw_affiliation_string":"Advanced Robotics Department, Italian Institute of Technology (IIT), 16163 Genova, Italy","institution_ids":["https://openalex.org/I30771326"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5036281885"],"corresponding_institution_ids":["https://openalex.org/I30771326"],"apc_list":null,"apc_paid":null,"fwci":32.0676,"has_fulltext":false,"cited_by_count":264,"citation_normalized_percentile":{"value":0.99720072,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3232","last_page":"3237"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10982","display_name":"Motor Control and Adaptation","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7221333980560303},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6857285499572754},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6850956082344055},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6587440967559814},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.5357652306556702},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.508571982383728},{"id":"https://openalex.org/keywords/motor-learning","display_name":"Motor learning","score":0.5046454668045044},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4935802221298218},{"id":"https://openalex.org/keywords/motor-skill","display_name":"Motor skill","score":0.48978471755981445},{"id":"https://openalex.org/keywords/torque","display_name":"Torque","score":0.4580302834510803},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.45582374930381775},{"id":"https://openalex.org/keywords/robot-kinematics","display_name":"Robot kinematics","score":0.4556189179420471},{"id":"https://openalex.org/keywords/robotic-arm","display_name":"Robotic arm","score":0.4379946291446686},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4228404462337494},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.34578776359558105},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.2222413420677185},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1842544972896576},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.06805166602134705}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7221333980560303},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6857285499572754},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6850956082344055},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6587440967559814},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.5357652306556702},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.508571982383728},{"id":"https://openalex.org/C107690735","wikidata":"https://www.wikidata.org/wiki/Q852461","display_name":"Motor learning","level":2,"score":0.5046454668045044},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4935802221298218},{"id":"https://openalex.org/C169976356","wikidata":"https://www.wikidata.org/wiki/Q13208902","display_name":"Motor skill","level":2,"score":0.48978471755981445},{"id":"https://openalex.org/C144171764","wikidata":"https://www.wikidata.org/wiki/Q48103","display_name":"Torque","level":2,"score":0.4580302834510803},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.45582374930381775},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.4556189179420471},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.4379946291446686},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4228404462337494},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.34578776359558105},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2222413420677185},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1842544972896576},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.06805166602134705},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iros.2010.5649089","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2010.5649089","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE/RSJ International Conference on Intelligent Robots and Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.174.8750","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.174.8750","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.calinon.ch/papers/Kormushev-IROS2010.pdf","raw_type":"text"},{"id":"pmh:oai:spiral.imperial.ac.uk:10044/1/26071","is_oa":false,"landing_page_url":"http://hdl.handle.net/10044/1/26071","pdf_url":null,"source":{"id":"https://openalex.org/S4306401396","display_name":"Spiral (Imperial College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I47508984","host_organization_name":"Imperial College London","host_organization_lineage":["https://openalex.org/I47508984"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2010 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"Conference Paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W76142776","https://openalex.org/W200863839","https://openalex.org/W787204617","https://openalex.org/W1516801383","https://openalex.org/W1684361744","https://openalex.org/W1885639605","https://openalex.org/W1974849157","https://openalex.org/W1980440818","https://openalex.org/W1983392485","https://openalex.org/W1986014385","https://openalex.org/W2012392077","https://openalex.org/W2027457629","https://openalex.org/W2042882799","https://openalex.org/W2113698995","https://openalex.org/W2119717200","https://openalex.org/W2122777916","https://openalex.org/W2127107099","https://openalex.org/W2127572219","https://openalex.org/W2129515556","https://openalex.org/W2131908539","https://openalex.org/W2144741745","https://openalex.org/W2154543878","https://openalex.org/W2161872510","https://openalex.org/W2172968643","https://openalex.org/W2744055297"],"related_works":["https://openalex.org/W4385452609","https://openalex.org/W4313255720","https://openalex.org/W1992538606","https://openalex.org/W2548273422","https://openalex.org/W2160983430","https://openalex.org/W2749023251","https://openalex.org/W2794101066","https://openalex.org/W4296340444","https://openalex.org/W2161872510","https://openalex.org/W2117552637"],"abstract_inverted_index":{"We":[0],"present":[1],"an":[2,95],"approach":[3,63],"allowing":[4],"a":[5,27,31,67,81,98],"robot":[6,86],"to":[7,50,88,93],"acquire":[8],"new":[9],"motor":[10,17],"skills":[11],"by":[12],"learning":[13,77],"the":[14,52,59,85,90],"couplings":[15],"across":[16],"control":[18],"variables.":[19],"The":[20,62],"demonstrated":[21],"skill":[22,76],"is":[23,47,64],"first":[24],"encoded":[25],"in":[26],"compact":[28],"form":[29],"through":[30],"modified":[32],"version":[33],"of":[34,54],"Dynamic":[35],"Movement":[36],"Primitives":[37],"(DMP)":[38],"which":[39],"encapsulates":[40],"correlation":[41],"information.":[42],"Expectation-Maximization":[43],"based":[44],"Reinforcement":[45],"Learning":[46],"then":[48],"used":[49],"modulate":[51],"mixture":[53],"dynamical":[55],"systems":[56],"initialized":[57],"from":[58],"user's":[60],"demonstration.":[61],"evaluated":[65],"on":[66],"torque-controlled":[68],"7":[69],"DOFs":[70],"Barrett":[71],"WAM":[72],"robotic":[73],"arm.":[74],"Two":[75],"experiments":[78],"are":[79],"conducted:":[80],"reaching":[82],"task":[83],"where":[84],"needs":[87],"adapt":[89],"learned":[91],"movement":[92],"avoid":[94],"obstacle,":[96],"and":[97],"dynamic":[99],"pancake-flipping":[100],"task.":[101]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":30},{"year":2019,"cited_by_count":27},{"year":2018,"cited_by_count":30},{"year":2017,"cited_by_count":18},{"year":2016,"cited_by_count":23},{"year":2015,"cited_by_count":16},{"year":2014,"cited_by_count":18},{"year":2013,"cited_by_count":12},{"year":2012,"cited_by_count":13}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
