{"id":"https://openalex.org/W4401415879","doi":"https://doi.org/10.1109/icra57147.2024.10610069","title":"Reinforcement Learning for Blind Stair Climbing with Legged and Wheeled-Legged Robots","display_name":"Reinforcement Learning for Blind Stair Climbing with Legged and Wheeled-Legged Robots","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4401415879","doi":"https://doi.org/10.1109/icra57147.2024.10610069"},"language":"en","primary_location":{"id":"doi:10.1109/icra57147.2024.10610069","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10610069","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079514022","display_name":"Simon Chamorro","orcid":null},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Simon Chamorro","raw_affiliation_strings":["&#x00C9;cole Polytechnique de Montr&#x00E9;al,Department of Computer and Software Engineering,Qu&#x00E9;bec,Canada"],"affiliations":[{"raw_affiliation_string":"&#x00C9;cole Polytechnique de Montr&#x00E9;al,Department of Computer and Software Engineering,Qu&#x00E9;bec,Canada","institution_ids":["https://openalex.org/I45683168"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041410798","display_name":"Victor Klemm","orcid":"https://orcid.org/0000-0002-6752-3397"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Victor Klemm","raw_affiliation_strings":["ETH Zurich,Robotic Systems Lab,Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich,Robotic Systems Lab,Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057849114","display_name":"Miguel de la Iglesia Valls","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miguel de La Iglesia Valls","raw_affiliation_strings":["Ascento Robotics,Zurich,Switzerland"],"affiliations":[{"raw_affiliation_string":"Ascento Robotics,Zurich,Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075885606","display_name":"Christopher Pal","orcid":"https://orcid.org/0000-0001-6534-2114"},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Christopher Pal","raw_affiliation_strings":["&#x00C9;cole Polytechnique de Montr&#x00E9;al,Department of Computer and Software Engineering,Qu&#x00E9;bec,Canada"],"affiliations":[{"raw_affiliation_string":"&#x00C9;cole Polytechnique de Montr&#x00E9;al,Department of Computer and Software Engineering,Qu&#x00E9;bec,Canada","institution_ids":["https://openalex.org/I45683168"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083003222","display_name":"Roland Siegwart","orcid":"https://orcid.org/0000-0002-2760-7983"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Roland Siegwart","raw_affiliation_strings":["ETH Zurich,Autonomous Systems Lab,Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich,Autonomous Systems Lab,Switzerland","institution_ids":["https://openalex.org/I35440088"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5079514022"],"corresponding_institution_ids":["https://openalex.org/I45683168"],"apc_list":null,"apc_paid":null,"fwci":3.3338,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.92818017,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"8081","last_page":"8087"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8723814487457275},{"id":"https://openalex.org/keywords/legged-robot","display_name":"Legged robot","score":0.705750584602356},{"id":"https://openalex.org/keywords/stair-climbing","display_name":"Stair climbing","score":0.6946589946746826},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6902614831924438},{"id":"https://openalex.org/keywords/hill-climbing","display_name":"Hill climbing","score":0.6127310991287231},{"id":"https://openalex.org/keywords/climbing","display_name":"Climbing","score":0.586581826210022},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5861978530883789},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.533845067024231},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42453569173812866},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18929266929626465},{"id":"https://openalex.org/keywords/physical-medicine-and-rehabilitation","display_name":"Physical medicine and rehabilitation","score":0.110192209482193},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.05767422914505005}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8723814487457275},{"id":"https://openalex.org/C2779908020","wikidata":"https://www.wikidata.org/wiki/Q1424704","display_name":"Legged robot","level":3,"score":0.705750584602356},{"id":"https://openalex.org/C2776319952","wikidata":"https://www.wikidata.org/wiki/Q2451755","display_name":"Stair climbing","level":2,"score":0.6946589946746826},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6902614831924438},{"id":"https://openalex.org/C135450995","wikidata":"https://www.wikidata.org/wiki/Q820272","display_name":"Hill climbing","level":2,"score":0.6127310991287231},{"id":"https://openalex.org/C95038775","wikidata":"https://www.wikidata.org/wiki/Q22857","display_name":"Climbing","level":2,"score":0.586581826210022},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5861978530883789},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.533845067024231},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42453569173812866},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18929266929626465},{"id":"https://openalex.org/C99508421","wikidata":"https://www.wikidata.org/wiki/Q2678675","display_name":"Physical medicine and rehabilitation","level":1,"score":0.110192209482193},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.05767422914505005},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icra57147.2024.10610069","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10610069","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},{"id":"pmh:oai:publications.polymtl.ca:59306","is_oa":false,"landing_page_url":"https://publications.polymtl.ca/59306/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401013","display_name":"PolyPublie (\u00c9cole Polytechnique de Montr\u00e9al)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45683168","host_organization_name":"Polytechnique Montr\u00e9al","host_organization_lineage":["https://openalex.org/I45683168"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Communication de conf\u00e9rence"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2046376809","https://openalex.org/W2158782408","https://openalex.org/W2605102758","https://openalex.org/W2736601468","https://openalex.org/W2779458783","https://openalex.org/W2911087563","https://openalex.org/W2940265767","https://openalex.org/W2951633861","https://openalex.org/W2963184939","https://openalex.org/W2964227158","https://openalex.org/W2968031102","https://openalex.org/W3003397085","https://openalex.org/W3012010640","https://openalex.org/W3093326211","https://openalex.org/W3093922502","https://openalex.org/W3101817006","https://openalex.org/W3104695585","https://openalex.org/W3104876774","https://openalex.org/W3109424835","https://openalex.org/W3175254947","https://openalex.org/W3176539729","https://openalex.org/W3213974477","https://openalex.org/W4205430897","https://openalex.org/W4250058668","https://openalex.org/W4292852788","https://openalex.org/W4292852808","https://openalex.org/W4312574175","https://openalex.org/W4383108204","https://openalex.org/W4383109371","https://openalex.org/W4387682164","https://openalex.org/W4387831910","https://openalex.org/W4401415792","https://openalex.org/W6638018090","https://openalex.org/W6692846177","https://openalex.org/W6741002519","https://openalex.org/W6800004206","https://openalex.org/W6801964084","https://openalex.org/W6846358943"],"related_works":["https://openalex.org/W2029973929","https://openalex.org/W2323112089","https://openalex.org/W2324058214","https://openalex.org/W3109128554","https://openalex.org/W4312590534","https://openalex.org/W4205407652","https://openalex.org/W4377138153","https://openalex.org/W4317738234","https://openalex.org/W2047426691","https://openalex.org/W3156781616"],"abstract_inverted_index":{"In":[0,69],"recent":[1],"years,":[2],"legged":[3],"and":[4,158,163],"wheeled-legged":[5],"robots":[6,29,160],"have":[7],"gained":[8],"prominence":[9],"for":[10,16,93,187],"tasks":[11],"in":[12,41,161,177],"environments":[13,112],"predominantly":[14],"created":[15],"humans":[17],"across":[18],"various":[19],"domains.":[20],"One":[21],"significant":[22],"challenge":[23],"faced":[24],"by":[25],"many":[26],"of":[27,67,83,107,128,135,147],"these":[28],"is":[30,132],"their":[31,39],"limited":[32],"capability":[33],"to":[34,57,63,71,90,173],"navigate":[35],"stairs,":[36],"which":[37,87],"hampers":[38],"functionality":[40],"multi-story":[42],"environments.":[43],"This":[44],"study":[45],"proposes":[46],"a":[47,59,64,80,136,148,181],"method":[48,167],"aimed":[49],"at":[50],"addressing":[51],"this":[52,188],"limitation,":[53],"employing":[54],"reinforcement":[55],"learning":[56],"develop":[58],"versatile":[60],"controller":[61],"applicable":[62],"wide":[65],"range":[66],"robots.":[68],"contrast":[70],"the":[72,84,97,105,117,129,133,140,143,169,178],"conventional":[73],"velocity-based":[74],"controllers,":[75],"our":[76,153,166],"approach":[77,131],"builds":[78],"upon":[79],"position-based":[81],"formulation":[82],"RL":[85],"task,":[86],"we":[88],"show":[89],"be":[91],"vital":[92],"stair":[94],"climbing.":[95],"Furthermore,":[96],"methodology":[98],"leverages":[99],"an":[100],"asymmetric":[101],"actor-critic":[102],"structure,":[103],"enabling":[104,142],"utilization":[106],"privileged":[108],"information":[109],"from":[110],"simulated":[111],"during":[113,122],"training":[114],"while":[115],"eliminating":[116],"reliance":[118],"on":[119,155],"exteroceptive":[120],"sensors":[121],"real-world":[123],"deployment.":[124],"Another":[125],"key":[126],"feature":[127],"proposed":[130],"incorporation":[134],"boolean":[137],"observation":[138],"within":[139],"controller,":[141],"activation":[144],"or":[145],"deactivation":[146],"stair-climbing":[149],"mode.":[150],"We":[151],"present":[152],"results":[154],"different":[156],"quadrupeds":[157],"bipedal":[159],"simulation":[162],"showcase":[164],"how":[165],"allows":[168],"balancing":[170],"robot":[171],"Ascento":[172],"climb":[174],"15cm":[175],"stairs":[176],"real":[179],"world,":[180],"task":[182],"that":[183],"was":[184],"previously":[185],"impossible":[186],"robot.":[189]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":13}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
