{"id":"https://openalex.org/W4313563129","doi":"https://doi.org/10.1109/humanoids53995.2022.10000225","title":"Dynamic Bipedal Turning through Sim-to-Real Reinforcement Learning","display_name":"Dynamic Bipedal Turning through Sim-to-Real Reinforcement Learning","publication_year":2022,"publication_date":"2022-11-28","ids":{"openalex":"https://openalex.org/W4313563129","doi":"https://doi.org/10.1109/humanoids53995.2022.10000225"},"language":"en","primary_location":{"id":"doi:10.1109/humanoids53995.2022.10000225","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids53995.2022.10000225","pdf_url":null,"source":{"id":"https://openalex.org/S4363608580","display_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017322738","display_name":"Fangzhou Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Fangzhou Yu","raw_affiliation_strings":["Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331"],"affiliations":[{"raw_affiliation_string":"Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020195251","display_name":"Ryan Batke","orcid":null},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ryan Batke","raw_affiliation_strings":["Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331"],"affiliations":[{"raw_affiliation_string":"Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025328125","display_name":"Jeremy Dao","orcid":null},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeremy Dao","raw_affiliation_strings":["Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331"],"affiliations":[{"raw_affiliation_string":"Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026407792","display_name":"Jonathan Hurst","orcid":null},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan Hurst","raw_affiliation_strings":["Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331"],"affiliations":[{"raw_affiliation_string":"Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014224596","display_name":"Kevin Green","orcid":"https://orcid.org/0000-0003-3922-4426"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kevin Green","raw_affiliation_strings":["Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331"],"affiliations":[{"raw_affiliation_string":"Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030052689","display_name":"Alan Fern","orcid":"https://orcid.org/0000-0001-5851-8935"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alan Fern","raw_affiliation_strings":["Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331"],"affiliations":[{"raw_affiliation_string":"Collaborative Robotics and Intelligent Systems Institute, Oregon State University,Corvallis,Oregon,USA,97331","institution_ids":["https://openalex.org/I131249849"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5017322738"],"corresponding_institution_ids":["https://openalex.org/I131249849"],"apc_list":null,"apc_paid":null,"fwci":4.1684,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.96047073,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"903","last_page":"910"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11170","display_name":"Biomimetic flight and propulsion mechanisms","score":0.9616000056266785,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.829181432723999},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.742828369140625},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6787419319152832},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6669447422027588},{"id":"https://openalex.org/keywords/robot-locomotion","display_name":"Robot locomotion","score":0.601144552230835},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5031101107597351},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49441099166870117},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.4673961102962494},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.46297380328178406},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4524766206741333},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.36427852511405945},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.35139065980911255},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.24939191341400146},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.19701850414276123}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.829181432723999},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.742828369140625},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6787419319152832},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6669447422027588},{"id":"https://openalex.org/C6101204","wikidata":"https://www.wikidata.org/wiki/Q7353391","display_name":"Robot locomotion","level":5,"score":0.601144552230835},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5031101107597351},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49441099166870117},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.4673961102962494},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.46297380328178406},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4524766206741333},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.36427852511405945},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.35139065980911255},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.24939191341400146},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.19701850414276123},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/humanoids53995.2022.10000225","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids53995.2022.10000225","pdf_url":null,"source":{"id":"https://openalex.org/S4363608580","display_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE-RAS 21st International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5301707831","display_name":null,"funder_award_id":"-16-1-0002","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G6665785327","display_name":null,"funder_award_id":"IIS-1849343,1314109-DGE","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W256081288","https://openalex.org/W1945123189","https://openalex.org/W2061983716","https://openalex.org/W2101340954","https://openalex.org/W2601610124","https://openalex.org/W2726187156","https://openalex.org/W2736601468","https://openalex.org/W2806858658","https://openalex.org/W2883488766","https://openalex.org/W2899718839","https://openalex.org/W2907537824","https://openalex.org/W2911087563","https://openalex.org/W2968213087","https://openalex.org/W2968764556","https://openalex.org/W3003936490","https://openalex.org/W3038194455","https://openalex.org/W3093922502","https://openalex.org/W3104876774","https://openalex.org/W3109689575","https://openalex.org/W3147968035","https://openalex.org/W3176539729","https://openalex.org/W3181074849","https://openalex.org/W3206762371","https://openalex.org/W4214717370","https://openalex.org/W4223604247","https://openalex.org/W4229044820","https://openalex.org/W4286611302","https://openalex.org/W4293160779","https://openalex.org/W4312900898","https://openalex.org/W4313563020","https://openalex.org/W6782175187"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4323768008","https://openalex.org/W1941703695","https://openalex.org/W2139139490","https://openalex.org/W2517926463","https://openalex.org/W2168918646","https://openalex.org/W2283275227","https://openalex.org/W2655458901"],"abstract_inverted_index":{"For":[0],"legged":[1,64,97],"robots":[2,65],"to":[3,58,105,144],"match":[4],"the":[5,147],"athletic":[6],"capabilities":[7],"of":[8,40,63,83],"humans":[9],"and":[10,20,30,139],"animals,":[11],"they":[12],"must":[13],"not":[14],"only":[15],"produce":[16,59],"robust":[17,71],"periodic":[18],"walking":[19,72],"running,":[21],"but":[22],"also":[23],"seamlessly":[24],"switch":[25],"between":[26],"nominal":[27],"locomotion":[28],"gaits":[29],"more":[31],"specialized":[32],"transient":[33],"maneuvers.":[34],"Despite":[35],"recent":[36],"advancements":[37],"in":[38,69],"controls":[39],"bipedal":[41,148],"robots,":[42,98],"there":[43],"has":[44],"been":[45],"little":[46],"focus":[47],"on":[48,86,146],"producing":[49,70],"highly":[50],"dynamic":[51],"behaviors.":[52,73],"Recent":[53],"work":[54,100],"utilizing":[55],"reinforcement":[56],"learning":[57,132],"policies":[60,77],"for":[61,96,131],"control":[62,94],"have":[66,78],"demonstrated":[67],"success":[68],"However,":[74],"these":[75],"learned":[76],"difficulty":[79],"expressing":[80],"a":[81,87,102,124,141],"multitude":[82],"different":[84],"behaviors":[85,134],"single":[88,117],"network.":[89],"Inspired":[90],"by":[91],"conventional":[92],"optimization-based":[93],"techniques":[95],"this":[99],"applies":[101],"recurrent":[103],"policy":[104],"execute":[106],"four-step,":[107],"90\u00b0":[108],"turns":[109],"trained":[110],"using":[111,127],"reference":[112],"data":[113,138],"generated":[114],"from":[115,135],"optimized":[116],"rigid":[118],"body":[119],"model":[120],"trajectories.":[121],"We":[122],"present":[123],"training":[125],"framework":[126],"epilogue":[128],"terminal":[129],"rewards":[130],"specific":[133],"pre-computed":[136],"trajectory":[137],"demonstrate":[140],"successful":[142],"transfer":[143],"hardware":[145],"robot":[149],"Cassie.":[150]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3}],"updated_date":"2026-02-25T08:12:03.925757","created_date":"2025-10-10T00:00:00"}
