{"id":"https://openalex.org/W4404953378","doi":"https://doi.org/10.1109/humanoids58906.2024.10769793","title":"Robust Humanoid Walking on Compliant and Uneven Terrain with Deep Reinforcement Learning","display_name":"Robust Humanoid Walking on Compliant and Uneven Terrain with Deep Reinforcement Learning","publication_year":2024,"publication_date":"2024-11-22","ids":{"openalex":"https://openalex.org/W4404953378","doi":"https://doi.org/10.1109/humanoids58906.2024.10769793"},"language":"en","primary_location":{"id":"doi:10.1109/humanoids58906.2024.10769793","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids58906.2024.10769793","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE-RAS 23rd International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2504.13619","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067779478","display_name":"Rohan Singh","orcid":"https://orcid.org/0000-0002-9399-618X"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]},{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Rohan P. Singh","raw_affiliation_strings":["National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","University of Tsukuba, Ibaraki, Japan","CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","institution_ids":["https://openalex.org/I73613424"]},{"raw_affiliation_string":"University of Tsukuba, Ibaraki, Japan","institution_ids":["https://openalex.org/I146399215"]},{"raw_affiliation_string":"CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014473932","display_name":"Mitsuharu Morisawa","orcid":"https://orcid.org/0000-0003-0056-4335"},"institutions":[{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Mitsuharu Morisawa","raw_affiliation_strings":["National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","institution_ids":["https://openalex.org/I73613424"]},{"raw_affiliation_string":"CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021406076","display_name":"Mehdi Benallegue","orcid":"https://orcid.org/0000-0001-7537-9498"},"institutions":[{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Mehdi Benallegue","raw_affiliation_strings":["National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","institution_ids":["https://openalex.org/I73613424"]},{"raw_affiliation_string":"CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101132534","display_name":"Zhaoming Xie","orcid":"https://orcid.org/0000-0002-6085-8178"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhaoming Xie","raw_affiliation_strings":["Stanford University,Department of Computer Science,USA","Department of Computer Science, Stanford University, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stanford University,Department of Computer Science,USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Department of Computer Science, Stanford University, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091136016","display_name":"Fumio Kanehiro","orcid":"https://orcid.org/0000-0002-0277-3467"},"institutions":[{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]},{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Fumio Kanehiro","raw_affiliation_strings":["National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","University of Tsukuba, Ibaraki, Japan","CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory) IRL,Japan","institution_ids":["https://openalex.org/I73613424"]},{"raw_affiliation_string":"University of Tsukuba, Ibaraki, Japan","institution_ids":["https://openalex.org/I146399215"]},{"raw_affiliation_string":"CNRS-AIST JRL (Joint Robotics Laboratory) IRL, National Institute of Advanced Industrial Science and Technology (AIST), Japan","institution_ids":["https://openalex.org/I73613424"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5067779478"],"corresponding_institution_ids":["https://openalex.org/I146399215","https://openalex.org/I73613424"],"apc_list":null,"apc_paid":null,"fwci":1.1991,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.77530154,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"497","last_page":"504"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13354","display_name":"Genetics and Physical Performance","score":0.9575999975204468,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10441","display_name":"Muscle Physiology and Disorders","score":0.9434000253677368,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.7768442034721375},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.7753236889839172},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7262523174285889},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6852636933326721},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6563293933868408},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6175317764282227},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4850101172924042},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.4534097909927368}],"concepts":[{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.7768442034721375},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.7753236889839172},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7262523174285889},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6852636933326721},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6563293933868408},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6175317764282227},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4850101172924042},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.4534097909927368},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/humanoids58906.2024.10769793","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids58906.2024.10769793","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE-RAS 23rd International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2504.13619","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.13619","pdf_url":"https://arxiv.org/pdf/2504.13619","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2504.13619","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.13619","pdf_url":"https://arxiv.org/pdf/2504.13619","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1987580649","https://openalex.org/W2034183217","https://openalex.org/W2114776783","https://openalex.org/W2128131727","https://openalex.org/W2133859362","https://openalex.org/W2158782408","https://openalex.org/W2220283420","https://openalex.org/W2569327030","https://openalex.org/W2787555781","https://openalex.org/W2913971027","https://openalex.org/W2967793392","https://openalex.org/W3006422628","https://openalex.org/W3011337332","https://openalex.org/W3038194455","https://openalex.org/W3093922502","https://openalex.org/W3148915740","https://openalex.org/W3176539729","https://openalex.org/W3205282600","https://openalex.org/W3206762371","https://openalex.org/W3206804182","https://openalex.org/W4205430897","https://openalex.org/W4313563049","https://openalex.org/W4313563148","https://openalex.org/W4317987839","https://openalex.org/W4321020593","https://openalex.org/W4385486316","https://openalex.org/W4385756663","https://openalex.org/W6741002519","https://openalex.org/W6778428183"],"related_works":["https://openalex.org/W2745063183","https://openalex.org/W4399671601","https://openalex.org/W1992962589","https://openalex.org/W4256317079","https://openalex.org/W2129850190","https://openalex.org/W2295425790","https://openalex.org/W3032871857","https://openalex.org/W3213331859","https://openalex.org/W4226458444","https://openalex.org/W4390637946"],"abstract_inverted_index":{"For":[0],"the":[1,33,42,69,98,107,117,124,135,157,168,178],"deployment":[2],"of":[3,35,44,126,156,180],"legged":[4],"robots":[5,50],"in":[6,75],"real-world":[7],"environments,":[8],"it":[9],"is":[10,59,137,201],"essential":[11],"to":[12,60,72,139,153,162],"develop":[13],"robust":[14,79],"locomotion":[15,46,95],"control":[16,151],"methods":[17],"for":[18,41,48,67,184,197],"challenging":[19,187],"terrains":[20,74,113,188],"that":[21,62,123],"may":[22],"exhibit":[23,140],"unexpected":[24],"deformability":[25],"and":[26,53,101,115,170,192,199],"irregularity.":[27],"In":[28],"this":[29,181],"paper,":[30],"we":[31,121,176],"explore":[32],"application":[34],"sim-to-real":[36],"deep":[37],"reinforcement":[38],"learning":[39],"(RL)":[40],"design":[43],"bipedal":[45,94,128],"controllers":[47],"humanoid":[49,84,109],"on":[51,81,106,167],"compliant":[52],"uneven":[54],"terrains.":[55],"Our":[56],"key":[57],"contribution":[58],"show":[61,102,177],"a":[63,82,127,149],"simple":[64],"training":[65,198],"curriculum":[66],"exposing":[68],"RL":[70],"agent":[71],"randomized":[73],"simulation":[76,174],"can":[77,131],"achieve":[78],"walking":[80,129,185],"real":[83],"robot":[85,136],"using":[86,97],"only":[87],"proprioceptive":[88],"feedback.":[89],"We":[90,147],"train":[91],"an":[92],"end-to-end":[93],"policy":[96,130,152,182],"proposed":[99],"approach,":[100],"extensive":[103],"real-robot":[104],"demonstration":[105],"HRP-5P":[108],"over":[110,186],"several":[111],"difficult":[112],"inside":[114],"outside":[116],"lab":[118],"environment.":[119],"Further,":[120],"argue":[122],"robustness":[125],"be":[132],"improved":[133],"if":[134],"allowed":[138],"aperiodic":[141],"motion":[142],"with":[143],"variable":[144],"stepping":[145],"frequency.":[146],"propose":[148],"new":[150],"enable":[154],"modification":[155],"observed":[158],"clock":[159],"signal,":[160],"leading":[161],"adaptive":[163],"gait":[164],"frequencies":[165],"depending":[166],"terrain":[169],"command":[171],"velocity.":[172],"Through":[173],"experiments,":[175],"effectiveness":[179],"specifically":[183],"by":[189],"controlling":[190],"swing":[191],"stance":[193],"durations.":[194],"The":[195],"code":[196],"evaluation":[200],"available":[202],"online.":[203],"https://github.com/rohanpsingh/LearningHumanoidWalking":[204]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":4}],"updated_date":"2026-05-13T08:25:38.343686","created_date":"2025-10-10T00:00:00"}
