{"id":"https://openalex.org/W4383109140","doi":"https://doi.org/10.1109/icra48891.2023.10160756","title":"Dextrous Tactile In-Hand Manipulation Using a Modular Reinforcement Learning Architecture","display_name":"Dextrous Tactile In-Hand Manipulation Using a Modular Reinforcement Learning Architecture","publication_year":2023,"publication_date":"2023-05-29","ids":{"openalex":"https://openalex.org/W4383109140","doi":"https://doi.org/10.1109/icra48891.2023.10160756"},"language":"en","primary_location":{"id":"doi:10.1109/icra48891.2023.10160756","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48891.2023.10160756","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075436631","display_name":"Johannes Pitz","orcid":null},"institutions":[{"id":"https://openalex.org/I83041830","display_name":"Deggendorf Institute of Technology","ror":"https://ror.org/02kw5st29","country_code":"DE","type":"education","lineage":["https://openalex.org/I83041830"]},{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Johannes Pitz","raw_affiliation_strings":["DLR Institute of Robotics and Mechatronics, Technical University of Munich","Deggendorf Institute of Technology"],"affiliations":[{"raw_affiliation_string":"DLR Institute of Robotics and Mechatronics, Technical University of Munich","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Deggendorf Institute of Technology","institution_ids":["https://openalex.org/I83041830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047970921","display_name":"Lennart R\u00f6stel","orcid":null},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]},{"id":"https://openalex.org/I83041830","display_name":"Deggendorf Institute of Technology","ror":"https://ror.org/02kw5st29","country_code":"DE","type":"education","lineage":["https://openalex.org/I83041830"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lennart R\u00f6stel","raw_affiliation_strings":["DLR Institute of Robotics and Mechatronics, Technical University of Munich","Deggendorf Institute of Technology"],"affiliations":[{"raw_affiliation_string":"DLR Institute of Robotics and Mechatronics, Technical University of Munich","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Deggendorf Institute of Technology","institution_ids":["https://openalex.org/I83041830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043414969","display_name":"Leon Sievers","orcid":"https://orcid.org/0000-0001-6430-4618"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]},{"id":"https://openalex.org/I83041830","display_name":"Deggendorf Institute of Technology","ror":"https://ror.org/02kw5st29","country_code":"DE","type":"education","lineage":["https://openalex.org/I83041830"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Leon Sievers","raw_affiliation_strings":["DLR Institute of Robotics and Mechatronics, Technical University of Munich","Deggendorf Institute of Technology"],"affiliations":[{"raw_affiliation_string":"DLR Institute of Robotics and Mechatronics, Technical University of Munich","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Deggendorf Institute of Technology","institution_ids":["https://openalex.org/I83041830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058972548","display_name":"Berthold B\u00e4uml","orcid":"https://orcid.org/0000-0002-4545-4765"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]},{"id":"https://openalex.org/I83041830","display_name":"Deggendorf Institute of Technology","ror":"https://ror.org/02kw5st29","country_code":"DE","type":"education","lineage":["https://openalex.org/I83041830"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Berthold B\u00e4uml","raw_affiliation_strings":["DLR Institute of Robotics and Mechatronics, Technical University of Munich","Deggendorf Institute of Technology"],"affiliations":[{"raw_affiliation_string":"DLR Institute of Robotics and Mechatronics, Technical University of Munich","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Deggendorf Institute of Technology","institution_ids":["https://openalex.org/I83041830"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5075436631"],"corresponding_institution_ids":["https://openalex.org/I62916508","https://openalex.org/I83041830"],"apc_list":null,"apc_paid":null,"fwci":5.3847,"has_fulltext":false,"cited_by_count":30,"citation_normalized_percentile":{"value":0.96358356,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1852","last_page":"1858"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7284132242202759},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6779849529266357},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6156015992164612},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5871725678443909},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5310870409011841},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.43305402994155884},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.41623276472091675},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3810940682888031},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3621964454650879},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16928353905677795}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7284132242202759},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6779849529266357},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6156015992164612},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5871725678443909},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5310870409011841},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.43305402994155884},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.41623276472091675},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3810940682888031},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3621964454650879},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16928353905677795},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icra48891.2023.10160756","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48891.2023.10160756","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},{"id":"pmh:oai:elib.dlr.de:195400","is_oa":false,"landing_page_url":"https://ieeexplore.ieee.org/document/10160756","pdf_url":null,"source":{"id":"https://openalex.org/S4377196266","display_name":"elib (German Aerospace Center)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2898391981","host_organization_name":"Deutsches Zentrum f\u00fcr Luft- und Raumfahrt e. V. (DLR)","host_organization_lineage":["https://openalex.org/I2898391981"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Konferenzbeitrag"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2090149479","https://openalex.org/W2134167019","https://openalex.org/W2885163910","https://openalex.org/W2963371290","https://openalex.org/W2963403143","https://openalex.org/W2963403593","https://openalex.org/W3203535725","https://openalex.org/W4223534396","https://openalex.org/W4226340130","https://openalex.org/W4293568259","https://openalex.org/W4304732338","https://openalex.org/W4312410889","https://openalex.org/W4383108265","https://openalex.org/W6753773310","https://openalex.org/W6803178138","https://openalex.org/W6810170190","https://openalex.org/W6846301785","https://openalex.org/W6846634178"],"related_works":["https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W4380318855","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W2378076731","https://openalex.org/W20361778","https://openalex.org/W2024136090"],"abstract_inverted_index":{"Dextrous":[0],"in-hand":[1],"manipulation":[2],"with":[3,15,192],"a":[4,9,39,91,102,118,129,150,167,193],"multi-fingered":[5],"robotic":[6,183],"hand":[7,17],"is":[8,55,79,109,113,147],"challenging":[10],"task,":[11],"esp.":[12],"when":[13,25,76],"performed":[14],"the":[16,32,50,61,64,71,77,87,96,105,124,139,161,181],"oriented":[18],"upside":[19],"down,":[20],"demanding":[21],"permanent":[22],"force-closure,":[23],"and":[24],"no":[26],"external":[27,53],"sensors":[28,54],"are":[29],"used.":[30],"For":[31],"task":[33,88,112],"of":[34,52,63,89,95,134,170],"reorienting":[35,90],"an":[36,48,56,143],"object":[37,65],"to":[38,67,74,93],"given":[40],"goal":[41,78,99,187],"orientation":[42],"(vs.":[43],"infinitely":[44],"spinning":[45],"it":[46],"around":[47],"axis),":[49],"lack":[51],"additional":[57],"fundamental":[58],"challenge":[59],"as":[60,142],"state":[62,141],"has":[66,127],"be":[68,190],"estimated":[69,148],"all":[70,185],"time,":[72],"e.g.,":[73],"detect":[75],"reached.":[80],"In":[81,163],"this":[82],"paper,":[83],"we":[84,165],"show":[85],"that":[86],"cube":[92,140],"any":[94],"24":[97,186],"possible":[98],"orientations":[100,188],"in":[101,115],"\u03c0/2-raster":[103],"using":[104,117],"torque-controlled":[106],"DLR-Hand":[107],"II":[108],"possible.":[110],"The":[111],"learned":[114],"simulation":[116],"modular":[119],"deep":[120,151],"reinforcement":[121],"learning":[122],"architecture:":[123],"actual":[125],"policy":[126],"only":[128],"small":[130],"observation":[131],"time":[132],"window":[133],"0.5":[135],"s":[136],"but":[137],"gets":[138],"explicit":[144],"input":[145],"which":[146],"via":[149],"differentiable":[152],"particle":[153],"filter":[154],"trained":[155],"on":[156,180],"data":[157],"generated":[158],"by":[159],"running":[160],"policy.":[162],"simulation,":[164],"reach":[166],"success":[168,195],"rate":[169],"92%":[171],"while":[172],"applying":[173],"significant":[174],"domain":[175],"randomization.":[176],"Via":[177],"zero-shot":[178],"Sim2Real-transfer":[179],"real":[182],"system,":[184],"can":[189],"reached":[191],"high":[194],"rate.":[196],"(Web:":[197],"dlr-alr.github.io/dlr-tactile-manipulation)":[198]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":8}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2023-07-05T00:00:00"}
