{"id":"https://openalex.org/W4312235756","doi":"https://doi.org/10.1109/iros47612.2022.9981112","title":"Training Dynamic Motion Primitives using Deep Reinforcement Learning to Control a Robotic Tadpole","display_name":"Training Dynamic Motion Primitives using Deep Reinforcement Learning to Control a Robotic Tadpole","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W4312235756","doi":"https://doi.org/10.1109/iros47612.2022.9981112"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9981112","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981112","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048151769","display_name":"Imran Hameed","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Imran Hameed","raw_affiliation_strings":["The Hong Kong Polytechnic University,Department of Mechanical Engineering,Hong Kong,China","Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University,Department of Mechanical Engineering,Hong Kong,China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103973713","display_name":"Xu Chao","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Xu Chao","raw_affiliation_strings":["The Hong Kong Polytechnic University,Department of Mechanical Engineering,Hong Kong,China","Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University,Department of Mechanical Engineering,Hong Kong,China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056734737","display_name":"David Navarro-Alarc\u00f3n","orcid":"https://orcid.org/0000-0002-3426-6638"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"David Navarro-Alarcon","raw_affiliation_strings":["The Hong Kong Polytechnic University,Department of Mechanical Engineering,Hong Kong,China","Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University,Department of Mechanical Engineering,Hong Kong,China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Mechanical Engineering, The Hong Kong Polytechnic University, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071742051","display_name":"Xingjian Jing","orcid":"https://orcid.org/0000-0003-3498-2180"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Xingjian Jing","raw_affiliation_strings":["City University of Hong Kong,Department of Mechanical Engineering,Hong Kong,China","Department of Mechanical Engineering, City University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"City University of Hong Kong,Department of Mechanical Engineering,Hong Kong,China","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Mechanical Engineering, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I168719708"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5048151769"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":0.9641,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.73581774,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11170","display_name":"Biomimetic flight and propulsion mechanisms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8484163284301758},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7554675340652466},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6839674711227417},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6178056001663208},{"id":"https://openalex.org/keywords/motion-control","display_name":"Motion control","score":0.5821001529693604},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5483570098876953},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.5102279186248779},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4762934744358063},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.44403427839279175},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.426441490650177},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.35804176330566406}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8484163284301758},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7554675340652466},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6839674711227417},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6178056001663208},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.5821001529693604},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5483570098876953},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.5102279186248779},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4762934744358063},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.44403427839279175},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.426441490650177},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.35804176330566406},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros47612.2022.9981112","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981112","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7900000214576721,"id":"https://metadata.un.org/sdg/14","display_name":"Life below water"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1146793508","https://openalex.org/W1771410628","https://openalex.org/W2012204020","https://openalex.org/W2023600285","https://openalex.org/W2068275355","https://openalex.org/W2085467124","https://openalex.org/W2136719407","https://openalex.org/W2145339207","https://openalex.org/W2156174987","https://openalex.org/W2158782408","https://openalex.org/W2161395589","https://openalex.org/W2169712669","https://openalex.org/W2783034017","https://openalex.org/W2793128170","https://openalex.org/W2794308328","https://openalex.org/W2910988768","https://openalex.org/W2911087563","https://openalex.org/W2963428623","https://openalex.org/W2963864421","https://openalex.org/W2968717280","https://openalex.org/W3107524692","https://openalex.org/W3173314523","https://openalex.org/W3187133229","https://openalex.org/W4200294561","https://openalex.org/W6638018090","https://openalex.org/W6684921986"],"related_works":["https://openalex.org/W2930863966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W2165180011","https://openalex.org/W3165944253","https://openalex.org/W1886477626","https://openalex.org/W1532677580","https://openalex.org/W2724299411","https://openalex.org/W4365788246"],"abstract_inverted_index":{"Developing":[0],"a":[1,40,64,74,89,153],"good":[2],"control":[3,11,29,47],"strategy":[4],"for":[5,27,48],"biomimetic":[6],"robots":[7],"is":[8,117],"challenging.":[9],"Robust":[10],"methods":[12,22],"require":[13],"an":[14],"accurate":[15],"model":[16,155],"of":[17,32,67,125,133,142,156,163],"the":[18,28,83,95,101,115,123,130,157,161,164,172,177],"robot.":[19],"Nowadays,":[20],"model-free":[21,45],"are":[23],"being":[24],"extensively":[25],"explored":[26],"and":[30,70,97,114,139,148,166],"navigation":[31],"terrestrial":[33],"robots.":[34],"In":[35],"this":[36,108],"paper,":[37],"we":[38,56],"consider":[39],"novel":[41],"deep":[42,134],"reinforcement":[43,76,135],"learning-based":[44],"swimming":[46,111],"our":[49,150],"bio-inspired":[50],"robotic":[51],"tadpole.":[52],"To":[53],"realize":[54],"this,":[55],"utilize":[57],"dynamic":[58,143],"motion":[59,68,84,144],"primitives,":[60],"which":[61],"can":[62],"represent":[63],"large":[65],"range":[66],"behaviors,":[69],"combine":[71],"them":[72],"with":[73,137],"decoupled":[75],"learning":[77,136],"framework.":[78],"The":[79],"proposed":[80],"architecture":[81],"optimizes":[82],"primitives":[85],"first":[86],"to":[87,99,119,159,175],"develop":[88],"travelling":[90],"wave":[91],"undulation":[92],"pattern":[93],"in":[94],"tail":[96],"then":[98],"navigate":[100,120],"robot":[102,116,158,174],"along":[103],"different":[104],"predefined":[105],"paths.":[106],"Through":[107],"framework,":[109],"effective":[110],"gait":[112],"emerges,":[113],"able":[118],"well":[121],"on":[122,152,171],"surface":[124],"water.":[126],"This":[127],"framework":[128],"combines":[129],"optimization":[131],"potential":[132],"stability":[138],"generalization":[140],"properties":[141],"primitives.":[145],"We":[146],"train":[147],"test":[149],"method":[151,165],"simulated":[154],"demonstrate":[160],"effectiveness":[162],"also":[167],"conduct":[168],"experimental":[169],"testing":[170],"real":[173],"verify":[176],"results.":[178]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
