{"id":"https://openalex.org/W7131875871","doi":"https://doi.org/10.1109/sii64115.2026.11404550","title":"Towards Torque-Driven Reinforcement Learning for Quadruped Locomotion","display_name":"Towards Torque-Driven Reinforcement Learning for Quadruped Locomotion","publication_year":2026,"publication_date":"2026-01-11","ids":{"openalex":"https://openalex.org/W7131875871","doi":"https://doi.org/10.1109/sii64115.2026.11404550"},"language":null,"primary_location":{"id":"doi:10.1109/sii64115.2026.11404550","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sii64115.2026.11404550","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/SICE International Symposium on System Integration (SII)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5099517731","display_name":"Jordan Dowdy","orcid":"https://orcid.org/0009-0000-4374-6943"},"institutions":[{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jordan Dowdy","raw_affiliation_strings":["University of Louisville,Department of Electrical and Computer Engineering"],"affiliations":[{"raw_affiliation_string":"University of Louisville,Department of Electrical and Computer Engineering","institution_ids":["https://openalex.org/I142740786"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033596369","display_name":"Jean Chagas Vaz","orcid":"https://orcid.org/0000-0002-2934-8209"},"institutions":[{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jean Chagas Vaz","raw_affiliation_strings":["University of Louisville,Faculty of Electrical and Computer Engineering,Louisville,KY,USA,40208"],"affiliations":[{"raw_affiliation_string":"University of Louisville,Faculty of Electrical and Computer Engineering,Louisville,KY,USA,40208","institution_ids":["https://openalex.org/I142740786"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5099517731"],"corresponding_institution_ids":["https://openalex.org/I142740786"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.94049861,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1259","last_page":"1264"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.41609999537467957,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.41609999537467957,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.23330000042915344,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.1559000015258789,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/traverse","display_name":"Traverse","score":0.906499981880188},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7914000153541565},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.7336999773979187},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6137999892234802},{"id":"https://openalex.org/keywords/torque","display_name":"Torque","score":0.5224999785423279},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.4447999894618988},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4422000050544739},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.436599999666214}],"concepts":[{"id":"https://openalex.org/C176809094","wikidata":"https://www.wikidata.org/wiki/Q15401496","display_name":"Traverse","level":2,"score":0.906499981880188},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7914000153541565},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.7336999773979187},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6137999892234802},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6121000051498413},{"id":"https://openalex.org/C144171764","wikidata":"https://www.wikidata.org/wiki/Q48103","display_name":"Torque","level":2,"score":0.5224999785423279},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.4447999894618988},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4422000050544739},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.436599999666214},{"id":"https://openalex.org/C89992363","wikidata":"https://www.wikidata.org/wiki/Q5961558","display_name":"Track (disk drive)","level":2,"score":0.41679999232292175},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.41200000047683716},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4052000045776367},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.37139999866485596},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.36880001425743103},{"id":"https://openalex.org/C2777295749","wikidata":"https://www.wikidata.org/wiki/Q12511","display_name":"Stairs","level":2,"score":0.36489999294281006},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.36329999566078186},{"id":"https://openalex.org/C6101204","wikidata":"https://www.wikidata.org/wiki/Q7353391","display_name":"Robot locomotion","level":5,"score":0.36010000109672546},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.33559998869895935},{"id":"https://openalex.org/C145565327","wikidata":"https://www.wikidata.org/wiki/Q852514","display_name":"Motion control","level":3,"score":0.33239999413490295},{"id":"https://openalex.org/C136434205","wikidata":"https://www.wikidata.org/wiki/Q3437269","display_name":"Hexapod","level":3,"score":0.3190999925136566},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3131999969482422},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2881999909877777}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/sii64115.2026.11404550","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sii64115.2026.11404550","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/SICE International Symposium on System Integration (SII)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2783173101","https://openalex.org/W3011016396","https://openalex.org/W3134580056","https://openalex.org/W3207033168","https://openalex.org/W3212580602","https://openalex.org/W4383108873","https://openalex.org/W4389352651","https://openalex.org/W4390481291","https://openalex.org/W4392945120","https://openalex.org/W4405180201","https://openalex.org/W4411550967"],"related_works":[],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1],"(RL)":[2],"for":[3,61,76],"legged":[4],"robots":[5],"is":[6],"advancing":[7],"locomotion,":[8],"demonstrating":[9],"its":[10],"ability":[11],"to":[12,14,31,65],"adapt":[13],"new":[15],"and":[16,34,90,109,132,142],"challenging":[17],"terrain.":[18],"Traditionally,":[19],"these":[20,47],"RL":[21,48,72,81,116],"locomotion":[22],"frameworks":[23,49],"are":[24,56,120],"position-based,":[25],"making":[26],"the":[27,40,101,115,123,137,146],"policy":[28,119],"less":[29],"adaptable":[30],"terrain":[32,89],"types":[33],"requiring":[35,98],"state":[36],"estimation":[37],"techniques":[38],"in":[39,58,83],"observation":[41],"space,":[42],"i.e.,":[43],"linear":[44,95],"velocity.":[45,104],"Moreover,":[46],"often":[50],"use":[51],"small,":[52],"lightweight":[53],"quadrupeds":[54],"that":[55],"limited":[57],"their":[59],"viability":[60],"high-complexity":[62],"tasks":[63],"due":[64],"hardware":[66],"constraints.":[67],"This":[68],"work":[69],"explores":[70],"an":[71,149],"torque":[73,117],"control":[74,118],"framework":[75,82],"heavyweight":[77],"high-torque":[78],"quadrupeds.":[79],"The":[80],"this":[84],"paper":[85],"can":[86,139],"traverse":[87],"rough":[88],"effectively":[91],"track":[92],"a":[93],"desired":[94],"velocity":[96],"without":[97,145],"knowledge":[99],"of":[100,114,129,148],"agent\u2019s":[102],"current":[103],"Using":[105],"Nvidia\u2019s":[106],"Isaac":[107,110],"Sim":[108],"Lab,":[111],"simulation":[112],"results":[113],"shown":[121],"on":[122],"Unitree":[124],"B1":[125],"quadruped,":[126],"achieving":[127],"speeds":[128],"3.5":[130],"m/s":[131],"1.5":[133],"rad/s.":[134],"In":[135],"addition,":[136],"quadruped":[138],"walk":[140],"up":[141],"down":[143],"stairs":[144],"aid":[147],"exteroceptive":[150],"sensor.":[151]},"counts_by_year":[],"updated_date":"2026-03-01T06:05:34.837733","created_date":"2026-02-28T00:00:00"}
