{"id":"https://openalex.org/W3134580056","doi":"https://doi.org/10.1109/iros47612.2022.9982132","title":"Robust High-Speed Running for Quadruped Robots via Deep Reinforcement Learning","display_name":"Robust High-Speed Running for Quadruped Robots via Deep Reinforcement Learning","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W3134580056","doi":"https://doi.org/10.1109/iros47612.2022.9982132","mag":"3134580056"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9982132","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9982132","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2103.06484","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011177211","display_name":"Guillaume Bellegarda","orcid":"https://orcid.org/0000-0001-5809-3340"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guillaume Bellegarda","raw_affiliation_strings":["University of Southern California (USC),Dynamic Robotics and Control Laboratory","Dynamic Robotics and Control Laboratory, University of Southern California (USC)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Southern California (USC),Dynamic Robotics and Control Laboratory","institution_ids":["https://openalex.org/I4210116723"]},{"raw_affiliation_string":"Dynamic Robotics and Control Laboratory, University of Southern California (USC)","institution_ids":["https://openalex.org/I4210116723","https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102026597","display_name":"Yiyu Chen","orcid":"https://orcid.org/0000-0001-5651-0075"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiyu Chen","raw_affiliation_strings":["University of Southern California (USC),Dynamic Robotics and Control Laboratory","Dynamic Robotics and Control Laboratory, University of Southern California (USC)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Southern California (USC),Dynamic Robotics and Control Laboratory","institution_ids":["https://openalex.org/I4210116723"]},{"raw_affiliation_string":"Dynamic Robotics and Control Laboratory, University of Southern California (USC)","institution_ids":["https://openalex.org/I4210116723","https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009351026","display_name":"Zunying Liu","orcid":"https://orcid.org/0000-0002-2983-2332"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhuochen Liu","raw_affiliation_strings":["University of Southern California (USC),Dynamic Robotics and Control Laboratory","Dynamic Robotics and Control Laboratory, University of Southern California (USC)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Southern California (USC),Dynamic Robotics and Control Laboratory","institution_ids":["https://openalex.org/I4210116723"]},{"raw_affiliation_string":"Dynamic Robotics and Control Laboratory, University of Southern California (USC)","institution_ids":["https://openalex.org/I4210116723","https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036664594","display_name":"Quan Nguyen","orcid":"https://orcid.org/0000-0001-8937-5121"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Quan Nguyen","raw_affiliation_strings":["University of Southern California (USC),Dynamic Robotics and Control Laboratory","Dynamic Robotics and Control Laboratory, University of Southern California (USC)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Southern California (USC),Dynamic Robotics and Control Laboratory","institution_ids":["https://openalex.org/I4210116723"]},{"raw_affiliation_string":"Dynamic Robotics and Control Laboratory, University of Southern California (USC)","institution_ids":["https://openalex.org/I4210116723","https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":19.1646,"has_fulltext":false,"cited_by_count":65,"citation_normalized_percentile":{"value":0.99775011,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"10364","last_page":"10370"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7882670760154724},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7298038005828857},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.7241604924201965},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.6689429879188538},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6355502605438232},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5974113345146179},{"id":"https://openalex.org/keywords/offset","display_name":"Offset (computer science)","score":0.5135300755500793},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4614158570766449},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4605819582939148},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4510483145713806},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.39336681365966797},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.24960851669311523}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7882670760154724},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7298038005828857},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.7241604924201965},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.6689429879188538},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6355502605438232},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5974113345146179},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.5135300755500793},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4614158570766449},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4605819582939148},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4510483145713806},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.39336681365966797},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.24960851669311523},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros47612.2022.9982132","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9982132","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2103.06484","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.06484","pdf_url":"https://arxiv.org/pdf/2103.06484","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2103.06484","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.06484","pdf_url":"https://arxiv.org/pdf/2103.06484","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W1191599655","https://openalex.org/W1771410628","https://openalex.org/W2068923975","https://openalex.org/W2161427949","https://openalex.org/W2205975260","https://openalex.org/W2294151168","https://openalex.org/W2295809278","https://openalex.org/W2546975091","https://openalex.org/W2605102758","https://openalex.org/W2736601468","https://openalex.org/W2767050701","https://openalex.org/W2793991136","https://openalex.org/W2899496413","https://openalex.org/W2909331752","https://openalex.org/W2911087563","https://openalex.org/W2962902376","https://openalex.org/W2963184621","https://openalex.org/W2963184939","https://openalex.org/W2963193690","https://openalex.org/W2963923407","https://openalex.org/W2968268581","https://openalex.org/W2972810470","https://openalex.org/W2977527020","https://openalex.org/W3003629310","https://openalex.org/W3003669699","https://openalex.org/W3004070224","https://openalex.org/W3029641972","https://openalex.org/W3038194455","https://openalex.org/W3039737909","https://openalex.org/W3093922502","https://openalex.org/W3094276053","https://openalex.org/W3099547539","https://openalex.org/W3101442004","https://openalex.org/W3104876774","https://openalex.org/W3106462682","https://openalex.org/W3175254947","https://openalex.org/W3176539729","https://openalex.org/W3178099496","https://openalex.org/W3204973825","https://openalex.org/W3206762371","https://openalex.org/W3206938627","https://openalex.org/W3207491493","https://openalex.org/W3209211683","https://openalex.org/W3213886952","https://openalex.org/W4200429861","https://openalex.org/W4205430897","https://openalex.org/W4205967660","https://openalex.org/W4206589784","https://openalex.org/W4226143977","https://openalex.org/W4286963241","https://openalex.org/W4300892751","https://openalex.org/W4311443585","https://openalex.org/W6627932998","https://openalex.org/W6741002519","https://openalex.org/W6755667589","https://openalex.org/W6767349745","https://openalex.org/W6778428183","https://openalex.org/W6785466209","https://openalex.org/W6793715182","https://openalex.org/W6794173013","https://openalex.org/W6798487212","https://openalex.org/W6801064428","https://openalex.org/W6801964084","https://openalex.org/W6802654813","https://openalex.org/W6805081537"],"related_works":["https://openalex.org/W4399671601","https://openalex.org/W1992962589","https://openalex.org/W3032871857","https://openalex.org/W1743191351","https://openalex.org/W3104633800","https://openalex.org/W3023567978","https://openalex.org/W3044778482","https://openalex.org/W2914059119","https://openalex.org/W3040494141","https://openalex.org/W1977229594"],"abstract_inverted_index":{"Deep":[0],"reinforcement":[1],"learning":[2,24,31,74],"has":[3],"emerged":[4],"as":[5,137],"a":[6,73,155,186,215,221,247],"popular":[7],"and":[8,34,49,56,84,95,114,139,141,183,191,217],"powerful":[9],"way":[10],"to":[11,32,78,102,108,130,189,194,208,241],"develop":[12],"locomotion":[13],"controllers":[14],"for":[15,51,88,161],"quadruped":[16,89,177,205,232,256],"robots.":[17,90],"Common":[18],"approaches":[19,43],"have":[20],"largely":[21],"focused":[22],"on":[23],"actions":[25,97],"directly":[26,98],"in":[27,99,153,181],"joint":[28],"space,":[29],"or":[30],"modify":[33],"offset":[35],"foot":[36],"positions":[37],"produced":[38],"by":[39],"trajectory":[40,58],"generators.":[41],"Both":[42],"typically":[44],"require":[45],"careful":[46],"reward":[47,127],"shaping":[48],"training":[50],"millions":[52],"of":[53,82,133,164,171,174,229,253],"time":[54,158],"steps,":[55,159],"with":[57,169,220,246],"generators":[59],"introduce":[60],"human":[61],"bias":[62],"into":[63],"the":[64,79,131,143,175,195,204,230,236,254],"resulting":[65],"control":[66],"policies.":[67],"In":[68],"this":[69,120],"paper,":[70],"we":[71,184],"present":[72],"framework":[75,121],"that":[76,119],"leads":[77,129],"natural":[80,134],"emergence":[81,132],"fast":[83],"robust":[85],"bounding":[86],"policies":[87],"The":[91],"agent":[92],"both":[93],"selects":[94],"controls":[96],"task":[100],"space":[101],"track":[103],"desired":[104],"velocity":[105],"commands":[106],"subject":[107],"environmental":[109],"noise":[110],"including":[111],"model":[112],"uncertainty":[113],"rough":[115,167],"terrain.":[116],"We":[117],"observe":[118],"improves":[122],"sample":[123],"efficiency,":[124],"necessitates":[125],"little":[126],"shaping,":[128],"gaits":[135],"such":[136],"galloping":[138],"bounding,":[140],"eases":[142],"sim-to-real":[144,192],"transfer":[145,188,193],"at":[146,210,243],"running":[147,165],"speeds.":[148],"Policies":[149],"can":[150],"be":[151],"learned":[152],"only":[154],"few":[156],"million":[157],"even":[160],"challenging":[162],"tasks":[163],"over":[166,172,211,227],"terrain":[168],"loads":[170],"100%":[173],"nominal":[176,231,255],"mass.":[178,233,257],"Training":[179],"occurs":[180],"PyBullet,":[182],"perform":[185],"sim-to-sim":[187],"Gazebo":[190],"Unitree":[196,237],"A1":[197,238],"hardware.":[198],"For":[199,234],"sim-to-sim,":[200],"our":[201],"results":[202],"show":[203],"is":[206,226,239],"able":[207,240],"run":[209],"4":[212],"m/s":[213,219,245],"without":[214],"load,":[216,224,250],"3.5":[218],"10":[222],"kg":[223,249],"which":[225],"83%":[228],"sim-to-real,":[235],"bound":[242],"2":[244],"5":[248],"representing":[251],"42%":[252]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":19},{"year":2024,"cited_by_count":18},{"year":2023,"cited_by_count":18},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
