{"id":"https://openalex.org/W4385696305","doi":"https://doi.org/10.1109/lra.2023.3303786","title":"Reinforcement Learning With Energy-Exchange Dynamics for Spring-Loaded Biped Robot Walking","display_name":"Reinforcement Learning With Energy-Exchange Dynamics for Spring-Loaded Biped Robot Walking","publication_year":2023,"publication_date":"2023-08-09","ids":{"openalex":"https://openalex.org/W4385696305","doi":"https://doi.org/10.1109/lra.2023.3303786"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2023.3303786","is_oa":true,"landing_page_url":"https://doi.org/10.1109/lra.2023.3303786","pdf_url":"https://ieeexplore.ieee.org/ielx7/7083369/7339444/10214113.pdf","source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/7083369/7339444/10214113.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070668609","display_name":"Cheng-Yu Kuo","orcid":"https://orcid.org/0000-0002-3085-0343"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Cheng-Yu Kuo","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan","Graduated School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan"],"raw_orcid":"https://orcid.org/0000-0002-3085-0343","affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Graduated School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079727582","display_name":"Hirofumi Shin","orcid":null},"institutions":[{"id":"https://openalex.org/I1283473643","display_name":"Honda (Japan)","ror":"https://ror.org/03jzay846","country_code":"JP","type":"company","lineage":["https://openalex.org/I1283473643"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hirofumi Shin","raw_affiliation_strings":["Honda R&amp;D, Ltd., Saitama, Japan"],"raw_orcid":"https://orcid.org/0000-0003-0265-3710","affiliations":[{"raw_affiliation_string":"Honda R&amp;D, Ltd., Saitama, Japan","institution_ids":["https://openalex.org/I1283473643"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042074952","display_name":"Takamitsu Matsubara","orcid":"https://orcid.org/0000-0003-3545-4814"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takamitsu Matsubara","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan","Graduated School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan"],"raw_orcid":"https://orcid.org/0000-0003-3545-4814","affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Graduated School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5070668609"],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":0.7304,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.66632487,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"8","issue":"10","first_page":"6243","last_page":"6250"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10409","display_name":"Fuel Cells and Related Materials","score":0.9772999882698059,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.9358999729156494,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8032991886138916},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.6350957751274109},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6177909970283508},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5622586607933044},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.49580392241477966},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.487528532743454},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.4548493027687073},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.454037606716156},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.4511595666408539},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.4401947557926178},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3689868450164795},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.1185917854309082},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10212355852127075}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8032991886138916},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.6350957751274109},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6177909970283508},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5622586607933044},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.49580392241477966},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.487528532743454},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.4548493027687073},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.454037606716156},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.4511595666408539},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.4401947557926178},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3689868450164795},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.1185917854309082},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10212355852127075},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2023.3303786","is_oa":true,"landing_page_url":"https://doi.org/10.1109/lra.2023.3303786","pdf_url":"https://ieeexplore.ieee.org/ielx7/7083369/7339444/10214113.pdf","source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/lra.2023.3303786","is_oa":true,"landing_page_url":"https://doi.org/10.1109/lra.2023.3303786","pdf_url":"https://ieeexplore.ieee.org/ielx7/7083369/7339444/10214113.pdf","source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.4699999988079071}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385696305.pdf","grobid_xml":"https://content.openalex.org/works/W4385696305.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W770013183","https://openalex.org/W1999050977","https://openalex.org/W2152842312","https://openalex.org/W3038822267","https://openalex.org/W3088662645","https://openalex.org/W3091094690","https://openalex.org/W3135263265","https://openalex.org/W3136025385","https://openalex.org/W3136437429","https://openalex.org/W3206620955","https://openalex.org/W3206762371","https://openalex.org/W3211835026","https://openalex.org/W4206679659","https://openalex.org/W4221142099","https://openalex.org/W4248446246","https://openalex.org/W4285102540","https://openalex.org/W4313562933","https://openalex.org/W4313563020","https://openalex.org/W4313563129","https://openalex.org/W4313598692","https://openalex.org/W6676801769","https://openalex.org/W6680657880","https://openalex.org/W6681631837","https://openalex.org/W6740033195"],"related_works":["https://openalex.org/W2118717649","https://openalex.org/W2413243053","https://openalex.org/W410723623","https://openalex.org/W2015341305","https://openalex.org/W2035068594","https://openalex.org/W4225593417","https://openalex.org/W2573498121","https://openalex.org/W3022298670","https://openalex.org/W3160494304","https://openalex.org/W3006162251"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,17,74,79,100,140,152],"probabilistic":[4],"Model-based":[5],"Reinforcement":[6],"Learning":[7],"(MBRL)":[8],"approach":[9,22,98],"for":[10,119],"learning":[11,117,150],"the":[12,42,48,51,69,84,115],"Energy-exchange":[13],"Dynamics":[14],"(EED)":[15],"of":[16,47,53,86,88],"spring-loaded":[18,102],"biped":[19,103],"robot.":[20],"Our":[21],"enables":[23],"on-site":[24,136,149],"walking":[25,80,121,128,137],"acquisition":[26,129,138],"with":[27,55,68,130,139],"high":[28],"sample":[29],"efficiency,":[30],"real-time":[31,146],"planning":[32,66],"capability,":[33],"and":[34,90,107,109,123,127,148],"generalizability":[35,110],"across":[36],"skill":[37],"conditions.":[38],"Specifically,":[39],"we":[40,72],"learn":[41],"data-driven":[43],"state":[44],"transition":[45],"dynamics":[46,143],"robot":[49,104],"in":[50,105,125],"formulation":[52],"energy-states,":[54],"their":[56],"interaction":[57],"characterized":[58],"as":[59],"energy-exchange":[60],"to":[61],"reduce":[62],"dimensionality.":[63],"To":[64],"improve":[65],"reliability":[67],"learned":[70],"EED,":[71],"design":[73],"control":[75],"space":[76],"based":[77],"on":[78],"trajectory":[81],"that":[82],"follows":[83],"law":[85],"conservation":[87],"energy":[89],"is":[91,111],"formulated":[92],"by":[93,113],"energy-states.":[94],"We":[95],"evaluated":[96],"our":[97],"using":[99,114],"four-degree-of-freedom":[101],"simulation":[106,126],"hardware,":[108],"validated":[112],"same":[116],"framework":[118],"different":[120],"speeds":[122],"terrains":[124],"hardware.":[131],"All":[132],"results":[133],"showed":[134],"successful":[135],"compact":[141],"nine-dimension":[142],"model,":[144],"40Hz":[145],"planning,":[147],"within":[151],"few":[153],"minutes.":[154]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-23T08:51:43.019350","created_date":"2025-10-10T00:00:00"}
