{"id":"https://openalex.org/W3203069471","doi":"https://doi.org/10.1109/tnnls.2021.3112718","title":"A Survey of Sim-to-Real Transfer Techniques Applied to Reinforcement Learning for Bioinspired Robots","display_name":"A Survey of Sim-to-Real Transfer Techniques Applied to Reinforcement Learning for Bioinspired Robots","publication_year":2021,"publication_date":"2021-09-29","ids":{"openalex":"https://openalex.org/W3203069471","doi":"https://doi.org/10.1109/tnnls.2021.3112718","mag":"3203069471"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2021.3112718","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3112718","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"review","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014928067","display_name":"Wei Zhu","orcid":"https://orcid.org/0000-0003-4251-1741"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Wei Zhu","raw_affiliation_strings":["Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan"],"raw_orcid":"https://orcid.org/0000-0003-4251-1741","affiliations":[{"raw_affiliation_string":"Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078971977","display_name":"Xian Guo","orcid":"https://orcid.org/0000-0003-3793-1207"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xian Guo","raw_affiliation_strings":["College of Artificial Intelligence, Institute of Robotics and Automatic Information System, Nankai University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0003-3793-1207","affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Institute of Robotics and Automatic Information System, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072945772","display_name":"Dai Owaki","orcid":"https://orcid.org/0000-0003-1217-3892"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Dai Owaki","raw_affiliation_strings":["Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058240917","display_name":"Kyo Kutsuzawa","orcid":"https://orcid.org/0000-0002-5326-7847"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kyo Kutsuzawa","raw_affiliation_strings":["Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan"],"raw_orcid":"https://orcid.org/0000-0002-5326-7847","affiliations":[{"raw_affiliation_string":"Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan","institution_ids":["https://openalex.org/I201537933"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060102825","display_name":"Mitsuhiro Hayashibe","orcid":"https://orcid.org/0000-0001-6179-5706"},"institutions":[{"id":"https://openalex.org/I201537933","display_name":"Tohoku University","ror":"https://ror.org/01dq60k83","country_code":"JP","type":"education","lineage":["https://openalex.org/I201537933"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Mitsuhiro Hayashibe","raw_affiliation_strings":["Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan"],"raw_orcid":"https://orcid.org/0000-0001-6179-5706","affiliations":[{"raw_affiliation_string":"Department of Robotics, Graduate School of Engineering, Tohoku University, Sendai, Japan","institution_ids":["https://openalex.org/I201537933"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5014928067"],"corresponding_institution_ids":["https://openalex.org/I201537933"],"apc_list":null,"apc_paid":null,"fwci":4.6178,"has_fulltext":false,"cited_by_count":72,"citation_normalized_percentile":{"value":0.95584575,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"34","issue":"7","first_page":"3444","last_page":"3459"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.9350000023841858,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8472166061401367},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6589680910110474},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6582967042922974},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6580703258514404},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.5718135237693787},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.5043033361434937},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.4344245195388794},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41242825984954834},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.34955334663391113},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1634349822998047}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8472166061401367},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6589680910110474},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6582967042922974},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6580703258514404},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.5718135237693787},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.5043033361434937},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.4344245195388794},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41242825984954834},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.34955334663391113},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1634349822998047},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tnnls.2021.3112718","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3112718","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5892974444","display_name":null,"funder_award_id":"JP20KK0256","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":150,"referenced_works":["https://openalex.org/W1191599655","https://openalex.org/W1480363156","https://openalex.org/W1511334422","https://openalex.org/W1602448039","https://openalex.org/W1968818868","https://openalex.org/W1974546321","https://openalex.org/W1975987482","https://openalex.org/W2013207866","https://openalex.org/W2022365837","https://openalex.org/W2042882799","https://openalex.org/W2050630772","https://openalex.org/W2057527471","https://openalex.org/W2060914855","https://openalex.org/W2083456681","https://openalex.org/W2087617385","https://openalex.org/W2096001037","https://openalex.org/W2100235553","https://openalex.org/W2107726111","https://openalex.org/W2109572794","https://openalex.org/W2112025910","https://openalex.org/W2112361218","https://openalex.org/W2116336719","https://openalex.org/W2122116594","https://openalex.org/W2124695578","https://openalex.org/W2127515439","https://openalex.org/W2133932631","https://openalex.org/W2140135625","https://openalex.org/W2145339207","https://openalex.org/W2147828974","https://openalex.org/W2158782408","https://openalex.org/W2167340365","https://openalex.org/W2172158418","https://openalex.org/W2201581102","https://openalex.org/W2205427871","https://openalex.org/W2213381658","https://openalex.org/W2221633012","https://openalex.org/W2257979135","https://openalex.org/W2295809278","https://openalex.org/W2342662072","https://openalex.org/W2529601334","https://openalex.org/W2529658650","https://openalex.org/W2535437139","https://openalex.org/W2568667779","https://openalex.org/W2604726708","https://openalex.org/W2604883922","https://openalex.org/W2605924076","https://openalex.org/W2606327391","https://openalex.org/W2616430965","https://openalex.org/W2729615412","https://openalex.org/W2736601468","https://openalex.org/W2767050701","https://openalex.org/W2772589676","https://openalex.org/W2779458783","https://openalex.org/W2781726626","https://openalex.org/W2795903659","https://openalex.org/W2796290181","https://openalex.org/W2811406095","https://openalex.org/W2902125520","https://openalex.org/W2902907165","https://openalex.org/W2911087563","https://openalex.org/W2912971983","https://openalex.org/W2915496388","https://openalex.org/W2924656332","https://openalex.org/W2931363641","https://openalex.org/W2950125763","https://openalex.org/W2952165569","https://openalex.org/W2962812027","https://openalex.org/W2963095800","https://openalex.org/W2963184939","https://openalex.org/W2963221646","https://openalex.org/W2963277051","https://openalex.org/W2963411833","https://openalex.org/W2963786176","https://openalex.org/W2963864421","https://openalex.org/W2964043796","https://openalex.org/W2964114602","https://openalex.org/W2966477753","https://openalex.org/W2967236418","https://openalex.org/W2967998934","https://openalex.org/W2968340082","https://openalex.org/W2968717280","https://openalex.org/W2969329576","https://openalex.org/W2970228732","https://openalex.org/W2972127687","https://openalex.org/W2982316857","https://openalex.org/W2990747716","https://openalex.org/W2992335548","https://openalex.org/W3000213934","https://openalex.org/W3001803449","https://openalex.org/W3003647188","https://openalex.org/W3003817470","https://openalex.org/W3005581722","https://openalex.org/W3009295642","https://openalex.org/W3010768390","https://openalex.org/W3012370795","https://openalex.org/W3013699912","https://openalex.org/W3016972249","https://openalex.org/W3022566517","https://openalex.org/W3025606523","https://openalex.org/W3028676366","https://openalex.org/W3029509103","https://openalex.org/W3029641972","https://openalex.org/W3030981716","https://openalex.org/W3039737909","https://openalex.org/W3091304796","https://openalex.org/W3093922502","https://openalex.org/W3101442004","https://openalex.org/W3103532359","https://openalex.org/W3104515094","https://openalex.org/W3104876774","https://openalex.org/W3208176110","https://openalex.org/W4214717370","https://openalex.org/W4237733001","https://openalex.org/W4287978564","https://openalex.org/W4288626282","https://openalex.org/W4294578467","https://openalex.org/W4297669644","https://openalex.org/W6627932998","https://openalex.org/W6640290305","https://openalex.org/W6675999342","https://openalex.org/W6680657880","https://openalex.org/W6684921986","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6704571135","https://openalex.org/W6718092244","https://openalex.org/W6729130418","https://openalex.org/W6730038592","https://openalex.org/W6730111887","https://openalex.org/W6736742618","https://openalex.org/W6737937804","https://openalex.org/W6741002519","https://openalex.org/W6741010574","https://openalex.org/W6744563498","https://openalex.org/W6747473740","https://openalex.org/W6748885356","https://openalex.org/W6750251063","https://openalex.org/W6756908582","https://openalex.org/W6758741661","https://openalex.org/W6760951303","https://openalex.org/W6764169831","https://openalex.org/W6765121789","https://openalex.org/W6768093820","https://openalex.org/W6769609827","https://openalex.org/W6772683233","https://openalex.org/W6776438516","https://openalex.org/W6777091672","https://openalex.org/W6778428183","https://openalex.org/W6803169502","https://openalex.org/W6841112233"],"related_works":["https://openalex.org/W4241523039","https://openalex.org/W2360028903","https://openalex.org/W4280543773","https://openalex.org/W178231042","https://openalex.org/W2366083136","https://openalex.org/W2387622493","https://openalex.org/W1932132538","https://openalex.org/W2357832196","https://openalex.org/W1566252468","https://openalex.org/W4200375594"],"abstract_inverted_index":{"The":[0,136],"state-of-the-art":[1,49],"reinforcement":[2,24],"learning":[3,25],"(RL)":[4],"techniques":[5,50,98,108,143],"have":[6],"made":[7],"innumerable":[8],"advancements":[9],"in":[10,14,88,102,188],"robot":[11,58,165],"control,":[12],"especially":[13],"combination":[15],"with":[16],"deep":[17,23],"neural":[18],"networks":[19],"(DNNs),":[20],"known":[21],"as":[22],"(DRL).":[26],"In":[27],"this":[28],"article,":[29],"instead":[30],"of":[31,85,114,119,126,134,138,142],"reviewing":[32],"the":[33,82],"theoretical":[34],"studies":[35],"on":[36,185],"RL,":[37],"which":[38],"were":[39],"almost":[40],"fully":[41],"completed":[42],"several":[43],"decades":[44],"ago,":[45],"we":[46,91],"summarize":[47],"some":[48],"added":[51],"to":[52,70,77,97,145,182],"commonly":[53],"used":[54],"RL":[55,152,184],"frameworks":[56],"for":[57,151],"control.":[59],"We":[60,105,171],"mainly":[61],"review":[62,95],"bioinspired":[63],"robots":[64],"(BIRs)":[65],"because":[66],"they":[67],"can":[68],"learn":[69],"locomote":[71],"or":[72],"produce":[73],"natural":[74,169],"behaviors":[75],"similar":[76],"animals":[78],"and":[79,121,128,131,148,158,163,167],"humans.":[80],"With":[81],"ultimate":[83],"goal":[84],"practical":[86],"applications":[87],"real":[89],"world,":[90],"further":[92],"narrow":[93],"our":[94],"scope":[96],"that":[99],"could":[100],"aid":[101],"sim-to-real":[103],"transfer.":[104],"categorized":[106],"these":[107,139,177],"into":[109],"four":[110,140],"groups:":[111],"1)":[112],"use":[113,118,125,133],"accurate":[115,149],"simulators;":[116],"2)":[117],"kinematic":[120],"dynamic":[122],"models;":[123],"3)":[124],"hierarchical":[127],"distributed":[129],"controllers;":[130],"4)":[132],"demonstrations.":[135],"purposes":[137],"groups":[141],"are":[144],"supply":[146],"general":[147],"environments":[150],"training,":[153],"improve":[154],"sampling":[155],"efficiency,":[156],"divide":[157],"conquer":[159],"complex":[160],"motion":[161],"tasks":[162],"redundant":[164],"structures,":[166],"acquire":[168],"skills.":[170],"found":[172],"that,":[173],"by":[174],"synthetically":[175],"using":[176],"techniques,":[178],"it":[179],"is":[180],"possible":[181],"deploy":[183],"physical":[186],"BIRs":[187],"actuality.":[189]},"counts_by_year":[{"year":2026,"cited_by_count":14},{"year":2025,"cited_by_count":25},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":6}],"updated_date":"2026-05-18T08:16:58.900851","created_date":"2021-10-11T00:00:00"}
