{"id":"https://openalex.org/W4210478179","doi":"https://doi.org/10.1109/lra.2022.3146903","title":"Closed-Loop Dynamic Control of a Soft Manipulator Using Deep Reinforcement Learning","display_name":"Closed-Loop Dynamic Control of a Soft Manipulator Using Deep Reinforcement Learning","publication_year":2022,"publication_date":"2022-01-31","ids":{"openalex":"https://openalex.org/W4210478179","doi":"https://doi.org/10.1109/lra.2022.3146903"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2022.3146903","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2022.3146903","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://orbit.dtu.dk/en/publications/0eac04fb-684c-4ed2-bf1b-a7d9a342655c","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012526977","display_name":"Andrea Centurelli","orcid":null},"institutions":[{"id":"https://openalex.org/I162290304","display_name":"Scuola Superiore Sant'Anna","ror":"https://ror.org/025602r80","country_code":"IT","type":"education","lineage":["https://openalex.org/I162290304"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Andrea Centurelli","raw_affiliation_strings":["BioRobotics Institute, Scuola Superiore Sant&#x2019;Anna, Pontedera, Italy","Department of Excellence in Robotics and AI, Scuola Superiore Sant'Anna, Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"BioRobotics Institute, Scuola Superiore Sant&#x2019;Anna, Pontedera, Italy","institution_ids":["https://openalex.org/I162290304"]},{"raw_affiliation_string":"Department of Excellence in Robotics and AI, Scuola Superiore Sant'Anna, Pisa, Italy","institution_ids":["https://openalex.org/I162290304"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086190512","display_name":"Luca Arleo","orcid":"https://orcid.org/0000-0002-2179-0684"},"institutions":[{"id":"https://openalex.org/I162290304","display_name":"Scuola Superiore Sant'Anna","ror":"https://ror.org/025602r80","country_code":"IT","type":"education","lineage":["https://openalex.org/I162290304"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Luca Arleo","raw_affiliation_strings":["BioRobotics Institute, Scuola Superiore Sant&#x2019;Anna, Pontedera, Italy","Department of Excellence in Robotics and AI, Scuola Superiore Sant'Anna, Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"BioRobotics Institute, Scuola Superiore Sant&#x2019;Anna, Pontedera, Italy","institution_ids":["https://openalex.org/I162290304"]},{"raw_affiliation_string":"Department of Excellence in Robotics and AI, Scuola Superiore Sant'Anna, Pisa, Italy","institution_ids":["https://openalex.org/I162290304"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016579788","display_name":"Alessandro Rizzo","orcid":"https://orcid.org/0000-0002-2386-3146"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessandro Rizzo","raw_affiliation_strings":["Department of Electronics and Telecommunications, Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Telecommunications, Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048001312","display_name":"Silvia Tolu","orcid":"https://orcid.org/0000-0003-1825-8440"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Silvia Tolu","raw_affiliation_strings":["Department of Electrical Engineering (Automation and Control), Technical University of Denmark, Lyngby, Denmark"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering (Automation and Control), Technical University of Denmark, Lyngby, Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045065209","display_name":"Cecilia Laschi","orcid":"https://orcid.org/0000-0001-5248-1043"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Cecilia Laschi","raw_affiliation_strings":["Department of Mechanical Engineering, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033570527","display_name":"Egidio Falotico","orcid":"https://orcid.org/0000-0001-8060-8080"},"institutions":[{"id":"https://openalex.org/I162290304","display_name":"Scuola Superiore Sant'Anna","ror":"https://ror.org/025602r80","country_code":"IT","type":"education","lineage":["https://openalex.org/I162290304"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Egidio Falotico","raw_affiliation_strings":["BioRobotics Institute, Scuola Superiore Sant&#x2019;Anna, Pontedera, Italy","Department of Excellence in Robotics and AI, Scuola Superiore Sant'Anna, Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"BioRobotics Institute, Scuola Superiore Sant&#x2019;Anna, Pontedera, Italy","institution_ids":["https://openalex.org/I162290304"]},{"raw_affiliation_string":"Department of Excellence in Robotics and AI, Scuola Superiore Sant'Anna, Pisa, Italy","institution_ids":["https://openalex.org/I162290304"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5012526977"],"corresponding_institution_ids":["https://openalex.org/I162290304"],"apc_list":null,"apc_paid":null,"fwci":6.4572,"has_fulltext":false,"cited_by_count":82,"citation_normalized_percentile":{"value":0.97801757,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"7","issue":"2","first_page":"4741","last_page":"4748"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11486","display_name":"Micro and Nano Robotics","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/3104","display_name":"Condensed Matter Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7159281373023987},{"id":"https://openalex.org/keywords/loop","display_name":"Loop (graph theory)","score":0.6259455680847168},{"id":"https://openalex.org/keywords/manipulator","display_name":"Manipulator (device)","score":0.581504762172699},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5569291114807129},{"id":"https://openalex.org/keywords/closed-loop","display_name":"Closed loop","score":0.4831523299217224},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47944775223731995},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.460582435131073},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.44615134596824646},{"id":"https://openalex.org/keywords/robot-manipulator","display_name":"Robot manipulator","score":0.44546428322792053},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30844852328300476},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2842090129852295},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.19197124242782593},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17990830540657043}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7159281373023987},{"id":"https://openalex.org/C184670325","wikidata":"https://www.wikidata.org/wiki/Q512604","display_name":"Loop (graph theory)","level":2,"score":0.6259455680847168},{"id":"https://openalex.org/C2781347998","wikidata":"https://www.wikidata.org/wiki/Q1587588","display_name":"Manipulator (device)","level":3,"score":0.581504762172699},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5569291114807129},{"id":"https://openalex.org/C3019251811","wikidata":"https://www.wikidata.org/wiki/Q5135346","display_name":"Closed loop","level":2,"score":0.4831523299217224},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47944775223731995},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.460582435131073},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.44615134596824646},{"id":"https://openalex.org/C2985527887","wikidata":"https://www.wikidata.org/wiki/Q1587588","display_name":"Robot manipulator","level":3,"score":0.44546428322792053},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30844852328300476},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2842090129852295},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.19197124242782593},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17990830540657043},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/lra.2022.3146903","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2022.3146903","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:pure.atira.dk:publications/0eac04fb-684c-4ed2-bf1b-a7d9a342655c","is_oa":true,"landing_page_url":"https://orbit.dtu.dk/en/publications/0eac04fb-684c-4ed2-bf1b-a7d9a342655c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400705","display_name":"Technical University of Denmark, DTU Orbit (Technical University of Denmark, DTU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I96673099","host_organization_name":"Technical University of Denmark","host_organization_lineage":["https://openalex.org/I96673099"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Centurelli , A , Arleo , L , Rizzo , A , Tolu , S , Laschi , C &amp; Falotico , E 2022 , ' Closed-loop Dynamic Control of a Soft Manipulator using Deep Reinforcement Learning ' , IEEE Robotics and Automation Letters , vol. 7 , no. 2 , pp. 4741-4748 . https://doi.org/10.1109/LRA.2022.3146903","raw_type":"article"},{"id":"pmh:oai:www.iris.sssup.it:11382/544564","is_oa":false,"landing_page_url":"http://hdl.handle.net/11382/544564","pdf_url":null,"source":{"id":"https://openalex.org/S4377196376","display_name":"CINECA IRIS Institutional Research Information System (Sant'Anna School of Advanced Studies)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I162290304","host_organization_name":"Scuola Superiore Sant'Anna","host_organization_lineage":["https://openalex.org/I162290304"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:zenodo.org:11162207","is_oa":true,"landing_page_url":"https://doi.org/10.1109/LRA.2022.3146903","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Robotics and Automation Letters, 7(2), 4741 - 4748, (2022-01-31)","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:publications/0eac04fb-684c-4ed2-bf1b-a7d9a342655c","is_oa":true,"landing_page_url":"https://orbit.dtu.dk/en/publications/0eac04fb-684c-4ed2-bf1b-a7d9a342655c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400705","display_name":"Technical University of Denmark, DTU Orbit (Technical University of Denmark, DTU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I96673099","host_organization_name":"Technical University of Denmark","host_organization_lineage":["https://openalex.org/I96673099"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Centurelli , A , Arleo , L , Rizzo , A , Tolu , S , Laschi , C &amp; Falotico , E 2022 , ' Closed-loop Dynamic Control of a Soft Manipulator using Deep Reinforcement Learning ' , IEEE Robotics and Automation Letters , vol. 7 , no. 2 , pp. 4741-4748 . https://doi.org/10.1109/LRA.2022.3146903","raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5099999904632568}],"awards":[{"id":"https://openalex.org/G2657901741","display_name":null,"funder_award_id":"863212","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1997060717","https://openalex.org/W2063507564","https://openalex.org/W2064675550","https://openalex.org/W2065682774","https://openalex.org/W2096645690","https://openalex.org/W2101433417","https://openalex.org/W2490314460","https://openalex.org/W2495535193","https://openalex.org/W2508900105","https://openalex.org/W2560730116","https://openalex.org/W2605807134","https://openalex.org/W2621077460","https://openalex.org/W2739636222","https://openalex.org/W2782435507","https://openalex.org/W2901112449","https://openalex.org/W2947094677","https://openalex.org/W2967429195","https://openalex.org/W2990316883","https://openalex.org/W3035790680","https://openalex.org/W3107758180","https://openalex.org/W3110084462","https://openalex.org/W3133349997","https://openalex.org/W3133933269","https://openalex.org/W3158338937","https://openalex.org/W3180197665","https://openalex.org/W3205667999","https://openalex.org/W6638018090"],"related_works":["https://openalex.org/W2322335058","https://openalex.org/W2259382430","https://openalex.org/W2397460850","https://openalex.org/W2391397427","https://openalex.org/W4322484979","https://openalex.org/W1996341361","https://openalex.org/W4366609476","https://openalex.org/W2078127841","https://openalex.org/W2612895087","https://openalex.org/W2156518980"],"abstract_inverted_index":{"The":[0,95,118,135],"focus":[1],"of":[2,20,49,104,132,155],"the":[3,7,18,47,105,130,133,139,153,156],"research":[4],"community":[5],"in":[6,99,129,143],"soft":[8],"robotic":[9,26],"field":[10],"has":[11],"been":[12,62],"on":[13,57],"developing":[14],"innovative":[15],"materials,":[16],"but":[17],"design":[19],"control":[21],"strategies":[22],"applicable":[23],"to":[24,36,44,68,152],"these":[25,72],"platforms":[27],"is":[28,34,42,141],"still":[29],"an":[30,102],"open":[31],"challenge.":[32],"This":[33,74],"due":[35],"their":[37],"highly":[38],"nonlinear":[39],"dynamics":[40],"which":[41],"difficult":[43],"model":[45,109],"and":[46,147],"degree":[48],"stochasticity":[50],"they":[51],"often":[52],"incorporate.":[53],"Data-driven":[54],"controllers":[55],"based":[56],"neural":[58,78],"networks":[59],"have":[60],"recently":[61],"explored":[63],"as":[64],"a":[65,77,84,112,149],"viable":[66],"solution":[67],"be":[69],"employed":[70],"for":[71],"manipulators.":[73],"letter":[75],"presents":[76],"network-based":[79],"closed-loop":[80],"controller,":[81],"trained":[82,119],"by":[83],"deep":[85],"reinforcement":[86],"learning":[87],"algorithm":[88],"called":[89],"Trust":[90],"Region":[91],"Policy":[92],"Optimization":[93],"(TRPO).":[94],"training":[96],"takes":[97],"place":[98],"simulation,":[100],"using":[101],"approximation":[103],"robot":[106],"forward":[107],"dynamic":[108],"obtained":[110],"with":[111,126,148],"Long-short":[113],"Term":[114],"Memory":[115],"(LSTM)":[116],"network.":[117],"controller":[120,140],"allows":[121],"following":[122],"different":[123,127],"paths":[124],"executed":[125],"velocities":[128],"workspace":[131],"robot.":[134],"results":[136],"demonstrate":[137],"that":[138],"effective":[142],"normal":[144],"working":[145],"conditions":[146],"payload":[150],"attached":[151],"end-effector":[154],"manipulator.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":26},{"year":2024,"cited_by_count":29},{"year":2023,"cited_by_count":22},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2022-02-08T00:00:00"}
