{"id":"https://openalex.org/W4303647912","doi":"https://doi.org/10.1109/lra.2022.3211785","title":"Meta Reinforcement Learning for Optimal Design of Legged Robots","display_name":"Meta Reinforcement Learning for Optimal Design of Legged Robots","publication_year":2022,"publication_date":"2022-10-01","ids":{"openalex":"https://openalex.org/W4303647912","doi":"https://doi.org/10.1109/lra.2022.3211785"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2022.3211785","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2022.3211785","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2210.02750","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047647638","display_name":"\u00c1lvaro Belmonte-Baeza","orcid":"https://orcid.org/0000-0001-9741-9497"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Alvaro Belmonte-Baeza","raw_affiliation_strings":["Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0001-9741-9497","affiliations":[{"raw_affiliation_string":"Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015754958","display_name":"Joonho Lee","orcid":"https://orcid.org/0000-0002-5072-7385"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joonho Lee","raw_affiliation_strings":["Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-5072-7385","affiliations":[{"raw_affiliation_string":"Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051485036","display_name":"Giorgio Valsecchi","orcid":"https://orcid.org/0000-0003-0595-3938"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giorgio Valsecchi","raw_affiliation_strings":["Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0003-0595-3938","affiliations":[{"raw_affiliation_string":"Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044258783","display_name":"Marco Hutter","orcid":"https://orcid.org/0000-0002-4285-4990"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marco Hutter","raw_affiliation_strings":["Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-4285-4990","affiliations":[{"raw_affiliation_string":"Robotic Systems Lab (RSL), ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047647638"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7166,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.83218635,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"7","issue":"4","first_page":"12134","last_page":"12141"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11170","display_name":"Biomimetic flight and propulsion mechanisms","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.882182240486145},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7081888914108276},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6704443693161011},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.533513069152832},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.508056640625},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.4707872271537781},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.45922011137008667},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.43579763174057007},{"id":"https://openalex.org/keywords/actuator","display_name":"Actuator","score":0.4174238443374634},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3978390395641327},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3330164849758148},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18794730305671692}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.882182240486145},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7081888914108276},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6704443693161011},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.533513069152832},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.508056640625},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.4707872271537781},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.45922011137008667},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.43579763174057007},{"id":"https://openalex.org/C172707124","wikidata":"https://www.wikidata.org/wiki/Q423488","display_name":"Actuator","level":2,"score":0.4174238443374634},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3978390395641327},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3330164849758148},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18794730305671692},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/lra.2022.3211785","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2022.3211785","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2210.02750","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2210.02750","pdf_url":"https://arxiv.org/pdf/2210.02750","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2210.02750","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2210.02750","pdf_url":"https://arxiv.org/pdf/2210.02750","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.49000000953674316,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W205095828","https://openalex.org/W2008150460","https://openalex.org/W2047234459","https://openalex.org/W2111904757","https://openalex.org/W2112036188","https://openalex.org/W2117085697","https://openalex.org/W2561621263","https://openalex.org/W2604763608","https://openalex.org/W2736021157","https://openalex.org/W2736601468","https://openalex.org/W2764255492","https://openalex.org/W2779458783","https://openalex.org/W2788030459","https://openalex.org/W2788904251","https://openalex.org/W2911087563","https://openalex.org/W2968213087","https://openalex.org/W2984106353","https://openalex.org/W2985106077","https://openalex.org/W3047039444","https://openalex.org/W3093922502","https://openalex.org/W3104876774","https://openalex.org/W3106528330","https://openalex.org/W3148904829","https://openalex.org/W3191225206","https://openalex.org/W4200058106","https://openalex.org/W4205430897","https://openalex.org/W4214717370","https://openalex.org/W4298174377","https://openalex.org/W4300509833","https://openalex.org/W4312624212","https://openalex.org/W6685726866","https://openalex.org/W6736057607","https://openalex.org/W6741002519","https://openalex.org/W6748600884","https://openalex.org/W6912248530"],"related_works":["https://openalex.org/W1992962589","https://openalex.org/W3032871857","https://openalex.org/W1743191351","https://openalex.org/W2789522126","https://openalex.org/W2066693961","https://openalex.org/W3104633800","https://openalex.org/W2368363778","https://openalex.org/W3023567978","https://openalex.org/W122584421","https://openalex.org/W4244295168"],"abstract_inverted_index":{"The":[0],"process":[1],"of":[2,12,29,88,129],"robot":[3],"design":[4,13,35,38,70,115,119,155],"is":[5,33,110],"a":[6,69,98,165],"complex":[7],"task":[8,32],"and":[9,59,78,85,168],"the":[10,82,118,124,147],"majority":[11],"decisions":[14],"are":[15,40,49],"still":[16],"based":[17],"on":[18],"human":[19],"intuition":[20],"or":[21,56,183],"tedious":[22],"manual":[23],"tuning.":[24],"A":[25],"more":[26],"informed":[27],"way":[28],"facing":[30],"this":[31,65],"computational":[34],"methods":[36],"where":[37],"parameters":[39,87],"concurrently":[41],"optimized":[42],"with":[43],"corresponding":[44],"controllers.":[45],"Existing":[46],"approaches,":[47],"however,":[48],"strongly":[50],"influenced":[51],"by":[52,180],"predefined":[53,181],"control":[54,127],"rules":[55],"motion":[57],"templates":[58],"cannot":[60],"provide":[61],"end-to-end":[62],"solutions.":[63],"In":[64],"paper,":[66],"we":[67,144,160],"present":[68],"optimization":[71],"framework":[72],"using":[73],"model-free":[74],"meta":[75,93,148],"reinforcement":[76,94],"learning,":[77],"its":[79],"application":[80],"to":[81,96,105,112,132],"optimizing":[83],"kinematics":[84],"actuator":[86],"quadrupedal":[89],"robots.":[90],"We":[91,121],"use":[92],"learning":[95],"train":[97],"locomotion":[99],"policy":[100,109,125,149],"that":[101,123,146,170],"can":[102,126],"quickly":[103],"adapt":[104],"different":[106,130],"designs.":[107],"This":[108],"used":[111],"evaluate":[113],"each":[114,154],"instance":[116,156],"during":[117],"optimization.":[120],"demonstrate":[122],"robots":[128],"designs":[131],"track":[133],"random":[134],"velocity":[135],"commands":[136],"over":[137],"various":[138],"rough":[139],"terrains.":[140],"With":[141],"controlled":[142],"experiments,":[143],"show":[145,169],"achieves":[150],"close-to-optimal":[151],"performance":[152,175],"for":[153],"after":[157],"adaptation.":[158],"Lastly,":[159],"compare":[161],"our":[162,171],"results":[163],"against":[164],"model-based":[166],"baseline":[167],"approach":[172],"allows":[173],"higher":[174],"while":[176],"not":[177],"being":[178],"constrained":[179],"motions":[182],"gait":[184],"patterns.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":7}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
