{"id":"https://openalex.org/W4413244285","doi":"https://doi.org/10.1145/3747865","title":"Walk This Way: Imitation-free Reinforcement Learning of Flexibly-Constrained Walking Controllers 60","display_name":"Walk This Way: Imitation-free Reinforcement Learning of Flexibly-Constrained Walking Controllers 60","publication_year":2025,"publication_date":"2025-08-08","ids":{"openalex":"https://openalex.org/W4413244285","doi":"https://doi.org/10.1145/3747865"},"language":"en","primary_location":{"id":"doi:10.1145/3747865","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3747865","pdf_url":null,"source":{"id":"https://openalex.org/S4210220973","display_name":"Proceedings of the ACM on Computer Graphics and Interactive Techniques","issn_l":"2577-6193","issn":["2577-6193"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Computer Graphics and Interactive Techniques","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1145/3747865","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004995695","display_name":"Tiffany Matth\u00e9","orcid":"https://orcid.org/0000-0002-4121-1061"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tiffany Matth\u00e9","raw_affiliation_strings":["University of British Columbia","University of British Columbia, Vancouver, Canada"],"raw_orcid":"https://orcid.org/0000-0002-4121-1061","affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]},{"raw_affiliation_string":"University of British Columbia, Vancouver, Canada","institution_ids":["https://openalex.org/I141945490"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058983574","display_name":"N. Ioannidis","orcid":null},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Nicholas Ioannidis","raw_affiliation_strings":["University of British Columbia","University of British Columbia, Vancouver, Canada"],"raw_orcid":"https://orcid.org/0009-0009-4172-6151","affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]},{"raw_affiliation_string":"University of British Columbia, Vancouver, Canada","institution_ids":["https://openalex.org/I141945490"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052748246","display_name":"Michiel van de Panne","orcid":"https://orcid.org/0000-0002-9123-3672"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Michiel van de Panne","raw_affiliation_strings":["University of British Columbia","University of British Columbia, Vancouver, Canada"],"raw_orcid":"https://orcid.org/0000-0002-9123-3672","affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]},{"raw_affiliation_string":"University of British Columbia, Vancouver, Canada","institution_ids":["https://openalex.org/I141945490"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21823913,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"8","issue":"4","first_page":"1","last_page":"19"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.8089895248413086},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.793643593788147},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7009291648864746},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6242201328277588},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6122910976409912},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6011088490486145},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4686379134654999},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4549930989742279},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.44807884097099304},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4233455955982208}],"concepts":[{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.8089895248413086},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.793643593788147},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7009291648864746},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6242201328277588},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6122910976409912},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6011088490486145},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4686379134654999},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4549930989742279},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.44807884097099304},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4233455955982208},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3747865","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3747865","pdf_url":null,"source":{"id":"https://openalex.org/S4210220973","display_name":"Proceedings of the ACM on Computer Graphics and Interactive Techniques","issn_l":"2577-6193","issn":["2577-6193"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Computer Graphics and Interactive Techniques","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3747865","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3747865","pdf_url":null,"source":{"id":"https://openalex.org/S4210220973","display_name":"Proceedings of the ACM on Computer Graphics and Interactive Techniques","issn_l":"2577-6193","issn":["2577-6193"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Computer Graphics and Interactive Techniques","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3598631485","display_name":null,"funder_award_id":"594644","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1983098320","https://openalex.org/W2003584832","https://openalex.org/W2039630509","https://openalex.org/W2140190473","https://openalex.org/W2739330054","https://openalex.org/W2784449021","https://openalex.org/W2796290181","https://openalex.org/W2984579799","https://openalex.org/W2987886924","https://openalex.org/W3034664137","https://openalex.org/W3093481944","https://openalex.org/W3104515094","https://openalex.org/W3105609823","https://openalex.org/W3108412994","https://openalex.org/W3147968035","https://openalex.org/W3181074849","https://openalex.org/W3193778841","https://openalex.org/W4226072218","https://openalex.org/W4229081732","https://openalex.org/W4255703114","https://openalex.org/W4256615025","https://openalex.org/W4285981737","https://openalex.org/W4312606126","https://openalex.org/W4313563049","https://openalex.org/W4328028361","https://openalex.org/W4383108816","https://openalex.org/W4386066131","https://openalex.org/W4386142062","https://openalex.org/W4390874171","https://openalex.org/W4401793915","https://openalex.org/W4404526366","https://openalex.org/W4405395255","https://openalex.org/W4405785534"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W2665305151"],"abstract_inverted_index":{"Locomotion":[0],"is":[1],"fundamental":[2],"to":[3,90,160],"the":[4,96,137,151],"repertoire":[5],"of":[6,9,30,66,79,130,139,155],"skills":[7],"required":[8],"physics-based":[10],"human-like":[11],"characters.":[12],"Control":[13],"policies":[14],"are":[15],"most":[16],"commonly":[17],"developed":[18],"using":[19,24,50,156],"reinforcement":[20],"learning":[21,53],"(RL)":[22],"and":[23,84,92,100,108,115,153,163],"reward":[25],"functions":[26],"based":[27],"on":[28],"imitation":[29],"motion":[31],"capture":[32],"data.":[33],"In":[34],"this":[35,122],"work,":[36],"we":[37,119,134],"propose":[38],"an":[39],"imitation-free":[40,71,123,157],"RL":[41,72,124,158],"training":[42],"pipeline":[43,125],"for":[44,144],"bipedal":[45],"locomotion":[46,165],"controllers,":[47],"as":[48],"achieved":[49],"a":[51,63,75,128,140],"multistage":[52],"curriculum.":[54],"Our":[55,148],"work":[56],"makes":[57],"several":[58],"contributions.":[59],"First,":[60],"it":[61],"introduces":[62],"minimal":[64],"set":[65],"additional":[67],"specifications":[68],"so":[69],"that":[70,121,136],"can":[73],"learn":[74],"single":[76],"policy":[77],"capable":[78],"in-place":[80],"turning,":[81],"side-stepping,":[82],"hopping,":[83],"one-step":[85],"foot":[86],"plants,":[87],"in":[88],"addition":[89],"forwards":[91],"backwards":[93],"walking.":[94],"Second,":[95],"method":[97],"offers":[98],"precise":[99],"flexible":[101,162],"conditioning,":[102],"with":[103],"control":[104,111],"over":[105,112],"footstep":[106,113,116],"locations":[107],"further":[109],"optional":[110],"timing,":[114],"orientation.":[117],"Third,":[118],"demonstrate":[120,150],"works":[126],"across":[127],"range":[129],"body":[131],"morphologies.":[132],"Last,":[133],"show":[135],"use":[138],"plasticity-preservation":[141],"technique":[142],"allows":[143],"significantly":[145],"faster":[146],"learning.":[147],"results":[149],"scalability":[152],"effectiveness":[154],"approaches":[159],"develop":[161],"highly-directable":[164],"policies.":[166]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
