{"id":"https://openalex.org/W3001997350","doi":"https://doi.org/10.1109/robio49542.2019.8961651","title":"Learning a Faster Locomotion Gait for a Quadruped Robot with Model-Free Deep Reinforcement Learning","display_name":"Learning a Faster Locomotion Gait for a Quadruped Robot with Model-Free Deep Reinforcement Learning","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3001997350","doi":"https://doi.org/10.1109/robio49542.2019.8961651","mag":"3001997350"},"language":"en","primary_location":{"id":"doi:10.1109/robio49542.2019.8961651","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio49542.2019.8961651","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101598277","display_name":"Biao Hu","orcid":"https://orcid.org/0000-0002-8968-7229"},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Biao Hu","raw_affiliation_strings":["Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","institution_ids":["https://openalex.org/I75390827"]},{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044872738","display_name":"Shibo Shao","orcid":"https://orcid.org/0009-0009-6275-9737"},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shibo Shao","raw_affiliation_strings":["Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","institution_ids":["https://openalex.org/I75390827"]},{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079155612","display_name":"Zhengcai Cao","orcid":"https://orcid.org/0000-0003-0344-0207"},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengcai Cao","raw_affiliation_strings":["Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","institution_ids":["https://openalex.org/I75390827"]},{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101535525","display_name":"Qing Xiao","orcid":"https://orcid.org/0000-0002-0649-5361"},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Xiao","raw_affiliation_strings":["Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Chemical Technology,College of Information Science and Technology,Beijing,China,100029","institution_ids":["https://openalex.org/I75390827"]},{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084789209","display_name":"Qunzhi Li","orcid":null},"institutions":[{"id":"https://openalex.org/I194716290","display_name":"China Academy of Space Technology","ror":"https://ror.org/025397a59","country_code":"CN","type":"government","lineage":["https://openalex.org/I194716290","https://openalex.org/I2802615301"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qunzhi Li","raw_affiliation_strings":["Beijing Institute of Spacecraft System Engineering,Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications,Beijing,China","Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications, Beijing Institute of Spacecraft System Engineering, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Spacecraft System Engineering,Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications,Beijing,China","institution_ids":["https://openalex.org/I194716290"]},{"raw_affiliation_string":"Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications, Beijing Institute of Spacecraft System Engineering, Beijing, China","institution_ids":["https://openalex.org/I194716290"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074711543","display_name":"Chao Ma","orcid":"https://orcid.org/0000-0002-3325-7318"},"institutions":[{"id":"https://openalex.org/I194716290","display_name":"China Academy of Space Technology","ror":"https://ror.org/025397a59","country_code":"CN","type":"government","lineage":["https://openalex.org/I194716290","https://openalex.org/I2802615301"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Ma","raw_affiliation_strings":["Beijing Institute of Spacecraft System Engineering,Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications,Beijing,China","Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications, Beijing Institute of Spacecraft System Engineering, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Spacecraft System Engineering,Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications,Beijing,China","institution_ids":["https://openalex.org/I194716290"]},{"raw_affiliation_string":"Beijing Key Laboratory of Intelligent Space Robotic Systems Technology and Applications, Beijing Institute of Spacecraft System Engineering, Beijing, China","institution_ids":["https://openalex.org/I194716290"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101598277"],"corresponding_institution_ids":["https://openalex.org/I75390827"],"apc_list":null,"apc_paid":null,"fwci":0.5869,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.66031921,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1097","last_page":"1102"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11170","display_name":"Biomimetic flight and propulsion mechanisms","score":0.9621999859809875,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.9473000168800354,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8497861623764038},{"id":"https://openalex.org/keywords/gait","display_name":"Gait","score":0.7499655485153198},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7032832503318787},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6594876050949097},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.644554853439331},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5604478716850281},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.5360085964202881},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.487813264131546},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.42265844345092773},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3568449318408966},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.23036199808120728},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06748482584953308}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8497861623764038},{"id":"https://openalex.org/C151800584","wikidata":"https://www.wikidata.org/wiki/Q2370000","display_name":"Gait","level":2,"score":0.7499655485153198},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7032832503318787},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6594876050949097},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.644554853439331},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5604478716850281},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.5360085964202881},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.487813264131546},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.42265844345092773},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3568449318408966},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.23036199808120728},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06748482584953308},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C42407357","wikidata":"https://www.wikidata.org/wiki/Q521","display_name":"Physiology","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio49542.2019.8961651","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio49542.2019.8961651","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1757796397","https://openalex.org/W1978102433","https://openalex.org/W1997576152","https://openalex.org/W2003889080","https://openalex.org/W2044976320","https://openalex.org/W2053881671","https://openalex.org/W2070153717","https://openalex.org/W2139053308","https://openalex.org/W2529573675","https://openalex.org/W2726187156","https://openalex.org/W2885878928","https://openalex.org/W2897143854","https://openalex.org/W2911087563","https://openalex.org/W2936971746","https://openalex.org/W2963184939","https://openalex.org/W2967118761","https://openalex.org/W2967236418","https://openalex.org/W2990123902","https://openalex.org/W4236829764","https://openalex.org/W4298857966","https://openalex.org/W6637967152","https://openalex.org/W6661730226","https://openalex.org/W6740222838","https://openalex.org/W6755645881"],"related_works":["https://openalex.org/W1992962589","https://openalex.org/W3032871857","https://openalex.org/W1743191351","https://openalex.org/W3104633800","https://openalex.org/W3023567978","https://openalex.org/W3044778482","https://openalex.org/W3040494141","https://openalex.org/W4384026392","https://openalex.org/W1977229594","https://openalex.org/W2072400776"],"abstract_inverted_index":{"Quadruped":[0],"robots":[1,20],"have":[2],"great":[3],"agility,":[4],"flexibility":[5],"and":[6,38,55,121,127],"stability,":[7],"which":[8],"enables":[9],"them":[10],"to":[11,46,75,104],"walk":[12],"through":[13],"uneven":[14],"terrain.":[15],"Motion":[16],"control":[17],"of":[18,79,99,118],"legged":[19],"is":[21,156],"always":[22],"a":[23,31,48,84,91],"difficult":[24],"problem.":[25],"Previous":[26],"approaches":[27],"mostly":[28],"either":[29],"use":[30,42],"predefined":[32],"gait":[33,49,78,89,151,162],"that":[34,51,67,133,155],"results":[35,131],"in":[36],"clumsy":[37],"unnatural":[39],"behavior,":[40],"or":[41],"reinforcement":[43,70,142],"learning":[44,71,128,143],"approach":[45,66,95,113,136],"generate":[47],"strategy":[50],"needs":[52],"longtime":[53],"computation":[54],"elegant":[56],"network":[57,124],"design.":[58],"In":[59],"this":[60,94],"paper,":[61],"we":[62],"present":[63],"an":[64],"effective":[65],"uses":[68],"deep":[69,141],"with":[72],"prior":[73,146],"knowledge":[74],"optimize":[76,105],"the":[77,97,106,160],"quadruped":[80,86],"robot.":[81],"By":[82],"using":[83],"specific":[85],"robot":[87],"walking":[88],"as":[90],"priori":[92],"knowledge,":[93],"adopts":[96],"technique":[98],"distributed":[100],"proximal":[101],"policy":[102],"optimization":[103],"search":[107],"for":[108],"better":[109],"gait.":[110],"The":[111],"proposed":[112,135],"does":[114],"not":[115],"require":[116],"modelling":[117],"complex":[119],"robots,":[120],"has":[122,152],"good":[123],"convergence":[125],"speed":[126,154],"effect.":[129],"Simulation":[130],"demonstrate":[132],"our":[134,149],"converges":[137],"faster":[138,158],"than":[139,159],"other":[140],"methods":[144],"without":[145,163],"knowledge.":[147],"Besides,":[148],"achieved":[150],"higher":[153],"50%":[157],"trot":[161],"optimization.":[164]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
