{"id":"https://openalex.org/W3044051321","doi":"https://doi.org/10.1109/lra.2020.3010461","title":"Deep Reinforcement Learning for Tactile Robotics: Learning to Type on a Braille Keyboard","display_name":"Deep Reinforcement Learning for Tactile Robotics: Learning to Type on a Braille Keyboard","publication_year":2020,"publication_date":"2020-07-20","ids":{"openalex":"https://openalex.org/W3044051321","doi":"https://doi.org/10.1109/lra.2020.3010461","mag":"3044051321"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2020.3010461","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2020.3010461","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2008.02646","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053354197","display_name":"Alex Church","orcid":"https://orcid.org/0000-0002-4062-5959"},"institutions":[{"id":"https://openalex.org/I4210161128","display_name":"Bristol Robotics Laboratory","ror":"https://ror.org/056sbyc67","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210161128"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alex Church","raw_affiliation_strings":["Department of Engineering Mathematics and Bristol Robotics Laboratory, University of Bristol, Bristol, U.K"],"raw_orcid":"https://orcid.org/0000-0002-4062-5959","affiliations":[{"raw_affiliation_string":"Department of Engineering Mathematics and Bristol Robotics Laboratory, University of Bristol, Bristol, U.K","institution_ids":["https://openalex.org/I4210161128"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025972235","display_name":"John W. Lloyd","orcid":"https://orcid.org/0000-0002-5630-683X"},"institutions":[{"id":"https://openalex.org/I4210161128","display_name":"Bristol Robotics Laboratory","ror":"https://ror.org/056sbyc67","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210161128"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"John Lloyd","raw_affiliation_strings":["Department of Engineering Mathematics and Bristol Robotics Laboratory, University of Bristol, Bristol, U.K"],"raw_orcid":"https://orcid.org/0000-0002-5630-683X","affiliations":[{"raw_affiliation_string":"Department of Engineering Mathematics and Bristol Robotics Laboratory, University of Bristol, Bristol, U.K","institution_ids":["https://openalex.org/I4210161128"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079415139","display_name":"Raia Hadsell","orcid":"https://orcid.org/0000-0002-2390-1771"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Raia Hadsell","raw_affiliation_strings":["Google DeepMind, London, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, U.K","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015897265","display_name":"Nathan F. Lepora","orcid":"https://orcid.org/0000-0001-5327-1523"},"institutions":[{"id":"https://openalex.org/I4210161128","display_name":"Bristol Robotics Laboratory","ror":"https://ror.org/056sbyc67","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210161128"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nathan F. Lepora","raw_affiliation_strings":["Department of Engineering Mathematics and Bristol Robotics Laboratory, University of Bristol, Bristol, U.K"],"raw_orcid":"https://orcid.org/0000-0001-5327-1523","affiliations":[{"raw_affiliation_string":"Department of Engineering Mathematics and Bristol Robotics Laboratory, University of Bristol, Bristol, U.K","institution_ids":["https://openalex.org/I4210161128"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.8299,"has_fulltext":true,"cited_by_count":33,"citation_normalized_percentile":{"value":0.84444943,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"5","issue":"4","first_page":"6145","last_page":"6152"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10338","display_name":"Advanced Sensor and Energy Harvesting Materials","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10338","display_name":"Advanced Sensor and Energy Harvesting Materials","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/braille","display_name":"Braille","score":0.7879606485366821},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7842512726783752},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7314358353614807},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6067358255386353},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5561846494674683},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.5515244007110596},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5321401953697205},{"id":"https://openalex.org/keywords/alphabet","display_name":"Alphabet","score":0.5254166126251221},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5253709554672241},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5064622163772583},{"id":"https://openalex.org/keywords/tactile-sensor","display_name":"Tactile sensor","score":0.4161829352378845},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10260486602783203}],"concepts":[{"id":"https://openalex.org/C2778802812","wikidata":"https://www.wikidata.org/wiki/Q79894","display_name":"Braille","level":2,"score":0.7879606485366821},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7842512726783752},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7314358353614807},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6067358255386353},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5561846494674683},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.5515244007110596},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5321401953697205},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.5254166126251221},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5253709554672241},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5064622163772583},{"id":"https://openalex.org/C46722567","wikidata":"https://www.wikidata.org/wiki/Q7674139","display_name":"Tactile sensor","level":3,"score":0.4161829352378845},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10260486602783203},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/lra.2020.3010461","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2020.3010461","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2008.02646","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.02646","pdf_url":"https://arxiv.org/pdf/2008.02646","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:research-information.bris.ac.uk:publications/dd5880d5-8ece-4852-9d21-9c3895d71d44","is_oa":true,"landing_page_url":null,"pdf_url":"https://arxiv.org/abs/2008.02646","source":{"id":"https://openalex.org/S4306400895","display_name":"Bristol Research (University of Bristol)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I36234482","host_organization_name":"University of Bristol","host_organization_lineage":["https://openalex.org/I36234482"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:research-information.bris.ac.uk:publications/dd5880d5-8ece-4852-9d21-9c3895d71d44","is_oa":true,"landing_page_url":"https://research-information.bris.ac.uk/en/publications/dd5880d5-8ece-4852-9d21-9c3895d71d44","pdf_url":"https://arxiv.org/abs/2008.02646","source":{"id":"https://openalex.org/S7407055359","display_name":"Explore Bristol Research","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Church, A, Lloyd, J, Hadsell, R & Lepora, N F 2020, 'Deep Reinforcement Learning for Tactile Robotics: Learning to Type on a Braille Keyboard', IEEE Robotics and Automation Letters, vol. 5, no. 4, pp. 6145 - 6152. https://doi.org/10.1109/LRA.2020.3010461","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:research-information.bris.ac.uk:openaire_cris_publications/dd5880d5-8ece-4852-9d21-9c3895d71d44","is_oa":true,"landing_page_url":"https://hdl.handle.net/1983/dd5880d5-8ece-4852-9d21-9c3895d71d44","pdf_url":null,"source":{"id":"https://openalex.org/S7407055359","display_name":"Explore Bristol Research","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Church, A, Lloyd, J, Hadsell, R & Lepora, N F 2020, 'Deep Reinforcement Learning for Tactile Robotics: Learning to Type on a Braille Keyboard', IEEE Robotics and Automation Letters, vol. 5, no. 4, pp. 6145 - 6152. https://doi.org/10.1109/LRA.2020.3010461","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2008.02646","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.02646","pdf_url":"https://arxiv.org/pdf/2008.02646","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7099999785423279}],"awards":[{"id":"https://openalex.org/G7896653347","display_name":null,"funder_award_id":"RL-2016-39","funder_id":"https://openalex.org/F4320319993","funder_display_name":"Leverhulme Trust"}],"funders":[{"id":"https://openalex.org/F4320319993","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":82,"referenced_works":["https://openalex.org/W1771410628","https://openalex.org/W2145339207","https://openalex.org/W2150468603","https://openalex.org/W2155968351","https://openalex.org/W2173564293","https://openalex.org/W2201581102","https://openalex.org/W2340935928","https://openalex.org/W2342662072","https://openalex.org/W2567455162","https://openalex.org/W2610395436","https://openalex.org/W2736601468","https://openalex.org/W2746553466","https://openalex.org/W2761873684","https://openalex.org/W2765994785","https://openalex.org/W2781493652","https://openalex.org/W2781585732","https://openalex.org/W2781726626","https://openalex.org/W2785738552","https://openalex.org/W2787938642","https://openalex.org/W2789008106","https://openalex.org/W2804941773","https://openalex.org/W2885163910","https://openalex.org/W2890803796","https://openalex.org/W2903932337","https://openalex.org/W2904246096","https://openalex.org/W2923189133","https://openalex.org/W2946222143","https://openalex.org/W2950268955","https://openalex.org/W2951799221","https://openalex.org/W2963048676","https://openalex.org/W2963390419","https://openalex.org/W2963411833","https://openalex.org/W2963477884","https://openalex.org/W2963641140","https://openalex.org/W2963864421","https://openalex.org/W2963884015","https://openalex.org/W2963923407","https://openalex.org/W2964001908","https://openalex.org/W2964227158","https://openalex.org/W2964291307","https://openalex.org/W2968585391","https://openalex.org/W2980825073","https://openalex.org/W2981030070","https://openalex.org/W2990599087","https://openalex.org/W2990747716","https://openalex.org/W3015462157","https://openalex.org/W3029539653","https://openalex.org/W3030520603","https://openalex.org/W3098436915","https://openalex.org/W3100674903","https://openalex.org/W3103780890","https://openalex.org/W4235910938","https://openalex.org/W4288102901","https://openalex.org/W4293864724","https://openalex.org/W4293872189","https://openalex.org/W4298159277","https://openalex.org/W4300799055","https://openalex.org/W6638018090","https://openalex.org/W6684921986","https://openalex.org/W6685444567","https://openalex.org/W6687681856","https://openalex.org/W6704571135","https://openalex.org/W6737327832","https://openalex.org/W6740801417","https://openalex.org/W6741002519","https://openalex.org/W6744838376","https://openalex.org/W6745274615","https://openalex.org/W6747387971","https://openalex.org/W6747473740","https://openalex.org/W6747924173","https://openalex.org/W6748599296","https://openalex.org/W6748839928","https://openalex.org/W6749115525","https://openalex.org/W6754615820","https://openalex.org/W6757592117","https://openalex.org/W6760595886","https://openalex.org/W6767997047","https://openalex.org/W6768008868","https://openalex.org/W6769508795","https://openalex.org/W6771026745","https://openalex.org/W6780559895","https://openalex.org/W6785251640"],"related_works":["https://openalex.org/W1525606688","https://openalex.org/W2113415290","https://openalex.org/W2056248531","https://openalex.org/W2805875310","https://openalex.org/W2626963359","https://openalex.org/W291345902","https://openalex.org/W4312729156","https://openalex.org/W2043289164","https://openalex.org/W2058549332","https://openalex.org/W1994305585"],"abstract_inverted_index":{"Artificial":[0],"touch":[1],"would":[2],"seem":[3],"well-suited":[4],"for":[5,159,172,178],"Reinforcement":[6],"Learning":[7],"(RL),":[8],"since":[9],"both":[10],"paradigms":[11],"rely":[12],"on":[13,38,101,117],"interaction":[14],"with":[15,166],"an":[16],"environment.":[17,73],"Here":[18],"we":[19,79],"propose":[20],"a":[21,39,176],"new":[22],"environment":[23],"and":[24,54,92,175],"set":[25],"of":[26,31,83,95,107,123,132,147,168],"tasks":[27,43,85,97],"to":[28,36,51,57],"encourage":[29],"development":[30],"tactile":[32,68,148],"reinforcement":[33],"learning:":[34],"learning":[35],"type":[37],"braille":[40,170],"keyboard.":[41],"Four":[42],"are":[44],"proposed,":[45],"progressing":[46],"in":[47,90,138],"difficulty":[48],"from":[49,55,70],"arrow":[50],"alphabet":[52,114],"keys":[53],"discrete":[56],"continuous":[58,113],"actions.":[59],"A":[60,105],"simulated":[61],"counterpart":[62],"is":[63],"also":[64],"constructed":[65],"by":[66],"sampling":[67],"data":[69],"the":[71,102,112,118,121,129,139,157,169,180],"physical":[72],"Using":[74],"state-of-the-art":[75],"deep":[76,135],"RL":[77,136],"algorithms,":[78],"show":[80],"that":[81,144],"all":[82],"these":[84],"can":[86,98],"be":[87,99],"successfully":[88,133],"learnt":[89],"simulation,":[91],"3":[93],"out":[94],"4":[96],"learned":[100],"real":[103,140],"robot.":[104,119],"lack":[106],"sample":[108],"efficiency":[109],"currently":[110],"makes":[111],"task":[115],"impractical":[116],"To":[120,150],"best":[122],"our":[124],"knowledge,":[125],"this":[126,155,160],"work":[127],"presents":[128],"first":[130],"demonstration":[131],"training":[134],"agents":[137],"world":[141],"using":[142],"observations":[143],"exclusively":[145],"consist":[146],"images.":[149],"aid":[151],"future":[152],"research":[153],"utilising":[154],"environment,":[156],"code":[158],"project":[161],"has":[162],"been":[163],"released":[164],"along":[165],"designs":[167],"keycaps":[171],"3D":[173],"printing":[174],"guide":[177],"recreating":[179],"experiments.":[181]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2022-07-26T00:00:00"}
