{"id":"https://openalex.org/W4394674699","doi":"https://doi.org/10.1126/scirobotics.adi8022","title":"Learning agile soccer skills for a bipedal robot with deep reinforcement learning","display_name":"Learning agile soccer skills for a bipedal robot with deep reinforcement learning","publication_year":2024,"publication_date":"2024-04-10","ids":{"openalex":"https://openalex.org/W4394674699","doi":"https://doi.org/10.1126/scirobotics.adi8022","pmid":"https://pubmed.ncbi.nlm.nih.gov/38598610"},"language":"en","primary_location":{"id":"doi:10.1126/scirobotics.adi8022","is_oa":false,"landing_page_url":"https://doi.org/10.1126/scirobotics.adi8022","pdf_url":null,"source":{"id":"https://openalex.org/S4210213233","display_name":"Science Robotics","issn_l":"2470-9476","issn":["2470-9476"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315823","host_organization_name":"American Association for the Advancement of Science","host_organization_lineage":["https://openalex.org/P4310315823"],"host_organization_lineage_names":["American Association for the Advancement of Science"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Science Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030073861","display_name":"Tuomas Haarnoja","orcid":"https://orcid.org/0009-0007-2973-9246"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Tuomas Haarnoja","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0009-0007-2973-9246","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044463979","display_name":"Ben Moran","orcid":"https://orcid.org/0000-0002-9254-662X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Ben Moran","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-9254-662X","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031943811","display_name":"Guy Lever","orcid":"https://orcid.org/0000-0001-9551-1839"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Guy Lever","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0001-9551-1839","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082738872","display_name":"Sandy H. Huang","orcid":"https://orcid.org/0000-0001-8920-2247"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Sandy H. Huang","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0001-8920-2247","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005912318","display_name":"Dhruva Tirumala","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Dhruva Tirumala","raw_affiliation_strings":["Google DeepMind, London, UK","University College London, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]},{"raw_affiliation_string":"University College London, London, UK","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102771619","display_name":"Jan Humplik","orcid":"https://orcid.org/0000-0002-7573-7635"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jan Humplik","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002747297","display_name":"Markus Wulfmeier","orcid":"https://orcid.org/0000-0003-1802-4492"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Markus Wulfmeier","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0003-1802-4492","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077653936","display_name":"Saran Tunyasuvunakool","orcid":"https://orcid.org/0000-0002-1620-6797"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Saran Tunyasuvunakool","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-1620-6797","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065489996","display_name":"Noah Siegel","orcid":"https://orcid.org/0000-0002-5746-117X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Noah Y. Siegel","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-5746-117X","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018196238","display_name":"Roland Hafner","orcid":"https://orcid.org/0000-0001-8061-8828"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Roland Hafner","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0001-8061-8828","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004482443","display_name":"Michael Bloesch","orcid":"https://orcid.org/0000-0002-2171-696X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Michael Bloesch","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-2171-696X","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078419629","display_name":"Kristian Hartikainen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kristian Hartikainen","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037305533","display_name":"Arunkumar Byravan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Arunkumar Byravan","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014567358","display_name":"Leonard Hasenclever","orcid":"https://orcid.org/0000-0003-1844-696X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Leonard Hasenclever","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0003-1844-696X","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008259889","display_name":"Yuval Tassa","orcid":"https://orcid.org/0000-0002-1197-288X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yuval Tassa","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-1197-288X","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006431582","display_name":"Fereshteh Sadeghi","orcid":"https://orcid.org/0000-0003-4058-5261"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Fereshteh Sadeghi","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010818667","display_name":"Nathan Batchelor","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nathan Batchelor","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028236088","display_name":"Federico Casarini","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Federico Casarini","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039840350","display_name":"Stefano Saliceti","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Stefano Saliceti","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071434961","display_name":"Charles Game","orcid":"https://orcid.org/0009-0004-6402-3014"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Charles Game","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0009-0004-6402-3014","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054501100","display_name":"Neil Sreendra","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210155811","display_name":"Interactive Research and Development","ror":"https://ror.org/04mccvy52","country_code":"PK","type":"nonprofit","lineage":["https://openalex.org/I4210155811"]}],"countries":["GB","PK"],"is_corresponding":false,"raw_author_name":"Neil Sreendra","raw_affiliation_strings":["Google DeepMind, London, UK","Proactive Global, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]},{"raw_affiliation_string":"Proactive Global, London, UK","institution_ids":["https://openalex.org/I4210155811"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090567851","display_name":"Kushal Patel","orcid":"https://orcid.org/0000-0003-3763-3998"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210155811","display_name":"Interactive Research and Development","ror":"https://ror.org/04mccvy52","country_code":"PK","type":"nonprofit","lineage":["https://openalex.org/I4210155811"]}],"countries":["GB","PK"],"is_corresponding":false,"raw_author_name":"Kushal Patel","raw_affiliation_strings":["Google DeepMind, London, UK","Proactive Global, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]},{"raw_affiliation_string":"Proactive Global, London, UK","institution_ids":["https://openalex.org/I4210155811"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074380892","display_name":"Marlon Gwira","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210155811","display_name":"Interactive Research and Development","ror":"https://ror.org/04mccvy52","country_code":"PK","type":"nonprofit","lineage":["https://openalex.org/I4210155811"]}],"countries":["GB","PK"],"is_corresponding":false,"raw_author_name":"Marlon Gwira","raw_affiliation_strings":["Google DeepMind, London, UK","Proactive Global, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]},{"raw_affiliation_string":"Proactive Global, London, UK","institution_ids":["https://openalex.org/I4210155811"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102705108","display_name":"Andrea Huber","orcid":"https://orcid.org/0000-0002-4431-8171"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrea Huber","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-4431-8171","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062886897","display_name":"Nicole Hurley","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nicole Hurley","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063532849","display_name":"Francesco Nori","orcid":"https://orcid.org/0000-0003-3763-6873"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Francesco Nori","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0003-3763-6873","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079415139","display_name":"Raia Hadsell","orcid":"https://orcid.org/0000-0002-2390-1771"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Raia Hadsell","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0002-2390-1771","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062951341","display_name":"Nicolas Heess","orcid":"https://orcid.org/0000-0001-7876-9256"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I4210113297","display_name":"Google (United Kingdom)","ror":"https://ror.org/024bc3e07","country_code":"GB","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210113297","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nicolas Heess","raw_affiliation_strings":["Google DeepMind, London, UK"],"raw_orcid":"https://orcid.org/0000-0001-7876-9256","affiliations":[{"raw_affiliation_string":"Google DeepMind, London, UK","institution_ids":["https://openalex.org/I4210113297","https://openalex.org/I4210090411"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":28,"corresponding_author_ids":["https://openalex.org/A5030073861","https://openalex.org/A5031943811","https://openalex.org/A5044463979","https://openalex.org/A5082738872"],"corresponding_institution_ids":["https://openalex.org/I4210090411","https://openalex.org/I4210113297"],"apc_list":null,"apc_paid":null,"fwci":23.7652,"has_fulltext":false,"cited_by_count":147,"citation_normalized_percentile":{"value":0.99875265,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"9","issue":"89","first_page":"eadi8022","last_page":"eadi8022"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8184840083122253},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6791788935661316},{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.6146488189697266},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5789185762405396},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5761482119560242},{"id":"https://openalex.org/keywords/throwing","display_name":"Throwing","score":0.5638041496276855},{"id":"https://openalex.org/keywords/agile-software-development","display_name":"Agile software development","score":0.5556986927986145},{"id":"https://openalex.org/keywords/ball","display_name":"Ball (mathematics)","score":0.4922262728214264},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4553646445274353},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.44544804096221924},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35386067628860474},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2208012044429779},{"id":"https://openalex.org/keywords/aeronautics","display_name":"Aeronautics","score":0.09773433208465576}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8184840083122253},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6791788935661316},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.6146488189697266},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5789185762405396},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5761482119560242},{"id":"https://openalex.org/C207451115","wikidata":"https://www.wikidata.org/wiki/Q12898216","display_name":"Throwing","level":2,"score":0.5638041496276855},{"id":"https://openalex.org/C14185376","wikidata":"https://www.wikidata.org/wiki/Q30232","display_name":"Agile software development","level":2,"score":0.5556986927986145},{"id":"https://openalex.org/C122041747","wikidata":"https://www.wikidata.org/wiki/Q838611","display_name":"Ball (mathematics)","level":2,"score":0.4922262728214264},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4553646445274353},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.44544804096221924},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35386067628860474},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2208012044429779},{"id":"https://openalex.org/C178802073","wikidata":"https://www.wikidata.org/wiki/Q8421","display_name":"Aeronautics","level":1,"score":0.09773433208465576},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D012916","descriptor_name":"Soccer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012916","descriptor_name":"Soccer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012916","descriptor_name":"Soccer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012916","descriptor_name":"Soccer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012916","descriptor_name":"Soccer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016138","descriptor_name":"Walking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016138","descriptor_name":"Walking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016138","descriptor_name":"Walking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016138","descriptor_name":"Walking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016138","descriptor_name":"Walking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1126/scirobotics.adi8022","is_oa":false,"landing_page_url":"https://doi.org/10.1126/scirobotics.adi8022","pdf_url":null,"source":{"id":"https://openalex.org/S4210213233","display_name":"Science Robotics","issn_l":"2470-9476","issn":["2470-9476"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315823","host_organization_name":"American Association for the Advancement of Science","host_organization_lineage":["https://openalex.org/P4310315823"],"host_organization_lineage_names":["American Association for the Advancement of Science"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Science Robotics","raw_type":"journal-article"},{"id":"pmid:38598610","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38598610","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Science robotics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":88,"referenced_works":["https://openalex.org/W153301390","https://openalex.org/W1495978126","https://openalex.org/W1931877416","https://openalex.org/W1945123189","https://openalex.org/W1977655452","https://openalex.org/W2034587361","https://openalex.org/W2100168570","https://openalex.org/W2102660061","https://openalex.org/W2104641222","https://openalex.org/W2105143952","https://openalex.org/W2105741987","https://openalex.org/W2109910161","https://openalex.org/W2117085697","https://openalex.org/W2125612430","https://openalex.org/W2127412976","https://openalex.org/W2141754131","https://openalex.org/W2144274908","https://openalex.org/W2145339207","https://openalex.org/W2158782408","https://openalex.org/W2161427949","https://openalex.org/W2162768030","https://openalex.org/W2205975260","https://openalex.org/W2739473244","https://openalex.org/W2750605955","https://openalex.org/W2762117857","https://openalex.org/W2762242067","https://openalex.org/W2785738552","https://openalex.org/W2788781499","https://openalex.org/W2796290181","https://openalex.org/W2889326414","https://openalex.org/W2905822515","https://openalex.org/W2907537824","https://openalex.org/W2911087563","https://openalex.org/W2911616846","https://openalex.org/W2913409451","https://openalex.org/W2914048451","https://openalex.org/W2946054758","https://openalex.org/W2954634850","https://openalex.org/W2973525135","https://openalex.org/W2982316857","https://openalex.org/W2992335548","https://openalex.org/W3003647188","https://openalex.org/W3007553593","https://openalex.org/W3024539867","https://openalex.org/W3034909023","https://openalex.org/W3036619998","https://openalex.org/W3039737909","https://openalex.org/W3040518754","https://openalex.org/W3041244724","https://openalex.org/W3046190872","https://openalex.org/W3080433414","https://openalex.org/W3093922502","https://openalex.org/W3096457737","https://openalex.org/W3104515094","https://openalex.org/W3104876774","https://openalex.org/W3126321819","https://openalex.org/W3164631379","https://openalex.org/W3167879406","https://openalex.org/W3175254947","https://openalex.org/W3176539729","https://openalex.org/W3184085787","https://openalex.org/W3212380917","https://openalex.org/W3213752693","https://openalex.org/W4200150166","https://openalex.org/W4205430897","https://openalex.org/W4205513846","https://openalex.org/W4226143977","https://openalex.org/W4283721947","https://openalex.org/W4283787029","https://openalex.org/W4287630848","https://openalex.org/W4297789683","https://openalex.org/W4309137642","https://openalex.org/W4311486620","https://openalex.org/W4312574175","https://openalex.org/W4312908419","https://openalex.org/W4317987839","https://openalex.org/W4360778240","https://openalex.org/W4383097455","https://openalex.org/W4383108204","https://openalex.org/W4383108291","https://openalex.org/W4383108493","https://openalex.org/W4383108925","https://openalex.org/W4385430486","https://openalex.org/W4385430550","https://openalex.org/W4385430644","https://openalex.org/W4389665855","https://openalex.org/W4390480981","https://openalex.org/W6930147935"],"related_works":["https://openalex.org/W2757445715","https://openalex.org/W4239855920","https://openalex.org/W2371249440","https://openalex.org/W2365576545","https://openalex.org/W3165347946","https://openalex.org/W4226007727","https://openalex.org/W2059660105","https://openalex.org/W2327671128","https://openalex.org/W2386414876","https://openalex.org/W3029718387"],"abstract_inverted_index":{"We":[0,31],"investigated":[1],"whether":[2],"deep":[3,33],"reinforcement":[4],"learning":[5],"(deep":[6],"RL)":[7],"is":[8],"able":[9],"to":[10,35,40,79,92,103,114,148],"synthesize":[11],"sophisticated":[12],"and":[13,52,63,65,73,83,112,127,151],"safe":[14],"movement":[15,54],"skills":[16],"for":[17],"a":[18,37,42,71,97,153,158],"low-cost,":[19],"miniature":[20],"humanoid":[21,38],"robot":[22,39],"that":[23,99],"can":[24],"be":[25,101],"composed":[26],"into":[27],"complex":[28],"behavioral":[29],"strategies.":[30],"used":[32],"RL":[34],"train":[36],"play":[41],"simplified":[43],"one-versus-one":[44],"soccer":[45],"game.":[46],"The":[47,87],"resulting":[48],"agent":[49,107,137],"exhibits":[50],"robust":[51],"dynamic":[53],"skills,":[55],"such":[56],"as":[57],"rapid":[58],"fall":[59],"recovery,":[60],"walking,":[61],"turning,":[62],"kicking,":[64],"it":[66],"transitions":[67],"between":[68],"them":[69],"in":[70,96,110],"smooth":[72],"efficient":[74],"manner.":[75],"It":[76],"also":[77],"learned":[78],"anticipate":[80],"ball":[81,154],"movements":[82],"block":[84],"opponent":[85],"shots.":[86],"agent's":[88],"tactical":[89],"behavior":[90],"adapts":[91],"specific":[93],"game":[94],"contexts":[95],"way":[98],"would":[100],"impractical":[102],"manually":[104],"design.":[105],"Our":[106],"was":[108],"trained":[109],"simulation":[111],"transferred":[113],"real":[115],"robots":[116],"zero-shot.":[117],"A":[118],"combination":[119],"of":[120],"sufficiently":[121],"high-frequency":[122],"control,":[123],"targeted":[124],"dynamics":[125],"randomization,":[126],"perturbations":[128],"during":[129],"training":[130],"enabled":[131],"good-quality":[132],"transfer.":[133],"In":[134],"experiments,":[135],"the":[136],"walked":[138],"181%":[139],"faster,":[140,143],"turned":[141],"302%":[142],"took":[144],"63%":[145],"less":[146],"time":[147],"get":[149],"up,":[150],"kicked":[152],"34%":[155],"faster":[156],"than":[157],"scripted":[159],"baseline.":[160]},"counts_by_year":[{"year":2026,"cited_by_count":16},{"year":2025,"cited_by_count":91},{"year":2024,"cited_by_count":35},{"year":2023,"cited_by_count":5}],"updated_date":"2026-05-26T13:28:51.108037","created_date":"2025-10-10T00:00:00"}
