{"id":"https://openalex.org/W4393553502","doi":"https://doi.org/10.5281/zenodo.7118519","title":"Figure Data for the paper \"Mastering the Game of Stratego with Model-Free Multiagent Reinforcement Learning\"","display_name":"Figure Data for the paper \"Mastering the Game of Stratego with Model-Free Multiagent Reinforcement Learning\"","publication_year":2022,"publication_date":"2022-10-31","ids":{"openalex":"https://openalex.org/W4393553502","doi":"https://doi.org/10.5281/zenodo.7118519"},"language":"en","primary_location":{"id":"pmh:oai:zenodo.org:7118519","is_oa":true,"landing_page_url":"https://zenodo.org/record/7118519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/7118519","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056707583","display_name":"Julien P\u00e9rolat","orcid":"https://orcid.org/0000-0002-8176-1666"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Perolat, Julien","raw_affiliation_strings":["DeepMind"],"raw_orcid":"https://orcid.org/0000-0002-8176-1666","affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027641103","display_name":"Bart De Vylder","orcid":"https://orcid.org/0000-0002-7833-4831"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"De Vylder, Bart","raw_affiliation_strings":["DeepMind"],"raw_orcid":"https://orcid.org/0000-0002-7833-4831","affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043984392","display_name":"Daniel Hennes","orcid":"https://orcid.org/0000-0002-3646-5286"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hennes, Daniel","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072903215","display_name":"Eugene Tarassov","orcid":"https://orcid.org/0000-0002-7330-860X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Tarassov, Eugene","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024394972","display_name":"Florian Strub","orcid":"https://orcid.org/0000-0001-7271-5345"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Strub, Florian","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048592673","display_name":"Vincent C. J. de Boer","orcid":"https://orcid.org/0000-0001-9928-1698"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"de Boer, Vincent","raw_affiliation_strings":["Independent consultant to DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Independent consultant to DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058922471","display_name":"Paul M\u00fcller","orcid":"https://orcid.org/0000-0002-5734-3130"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Muller, Paul","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041881668","display_name":"Jerome T. Connor","orcid":"https://orcid.org/0000-0002-7141-6260"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Connor, Jerome T.","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018555885","display_name":"Neil Burch","orcid":"https://orcid.org/0000-0002-4596-3690"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Burch, Neil","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000081835","display_name":"Thomas Anthony","orcid":"https://orcid.org/0000-0002-4443-5466"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Anthony, Thomas","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064779744","display_name":"Stephen McAleer","orcid":"https://orcid.org/0000-0003-0118-6874"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"McAleer, Stephen","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085971810","display_name":"Romuald \u00c9lie","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Elie, Romuald","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112612157","display_name":"Sarah H. Cen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Cen, Sarah H.","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100407597","display_name":"Zhe Wang","orcid":"https://orcid.org/0000-0002-0748-5376"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wang, Zhe","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040179074","display_name":"Audr\u016bnas Gruslys","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Gruslys, Audrunas","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073631643","display_name":"Aleksandra Malysheva","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Malysheva, Aleksandra","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061261923","display_name":"Mina Khan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Khan, Mina","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049332971","display_name":"Sherjil Ozair","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ozair, Sherjil","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090501025","display_name":"Finbarr Timbers","orcid":"https://orcid.org/0000-0001-9047-9542"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Timbers, Finbarr","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045681608","display_name":"Toby Pohlen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Pohlen, Toby","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019669511","display_name":"Tom Eccles","orcid":"https://orcid.org/0000-0001-6706-017X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Eccles, Tom","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108379405","display_name":"Mark Rowland","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Rowland, Mark","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049659586","display_name":"Marc Lanctot","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Lanctot, Marc","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058299981","display_name":"Jean-Baptiste Lespiau","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Lespiau, Jean-Baptiste","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103033215","display_name":"Bilal Piot","orcid":"https://orcid.org/0000-0003-3906-950X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Piot, Bilal","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052169592","display_name":"Shayegan Omidshafiei","orcid":"https://orcid.org/0000-0001-7758-1454"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Omidshafiei, Shayegan","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081026564","display_name":"Edward Lockhart","orcid":"https://orcid.org/0000-0001-8753-0765"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Lockhart, Edward","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053301405","display_name":"Laurent Sifre","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sifre, Laurent","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050359774","display_name":"Nathalie Beauguerlange","orcid":"https://orcid.org/0000-0002-6246-4279"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Beauguerlange, Nathalie","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006533777","display_name":"R\u00e9mi Munos","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Munos, Remi","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091771290","display_name":"David Silver","orcid":"https://orcid.org/0000-0002-5197-2892"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Silver, David","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065366930","display_name":"Satinder Singh","orcid":"https://orcid.org/0000-0002-2736-7641"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Singh, Satinder","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005349213","display_name":"Demis Hassabis","orcid":"https://orcid.org/0000-0003-2812-9917"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hassabis, Demis","raw_affiliation_strings":["DeepMind"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008547992","display_name":"Karl Tuyls","orcid":"https://orcid.org/0000-0001-7929-1944"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"Google DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Tuyls, Karl","raw_affiliation_strings":["DeepMind"],"raw_orcid":"https://orcid.org/0000-0001-7929-1944","affiliations":[{"raw_affiliation_string":"DeepMind","institution_ids":["https://openalex.org/I4210090411"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":34,"corresponding_author_ids":["https://openalex.org/A5056707583"],"corresponding_institution_ids":["https://openalex.org/I4210090411"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.8116000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.8116000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12137","display_name":"Economic theories and models","score":0.7986000180244446,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.7562999725341797,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7655911445617676},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5835739970207214},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5570042133331299},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3862202763557434},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.17935362458229065},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.06607648730278015}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7655911445617676},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5835739970207214},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5570042133331299},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3862202763557434},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.17935362458229065},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.06607648730278015}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:zenodo.org:7118519","is_oa":true,"landing_page_url":"https://zenodo.org/record/7118519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},{"id":"doi:10.5281/zenodo.7118519","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.7118519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:7118519","is_oa":true,"landing_page_url":"https://zenodo.org/record/7118519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291"],"abstract_inverted_index":{"<strong>Data":[0],"Release":[1],"for":[2,178],"Article:":[3],"<em>Mastering":[4],"the":[5,21,26,30,76,93,103,115,129,151,176,179],"Game":[6,31],"of":[7,32,102,128],"Stratego":[8,33],"with":[9,34,92],"Model-Free":[10,36],"Multiagent":[11,37],"Reinforcement":[12,38],"Learning</em></strong>":[13],"This":[14,189],"package":[15],"releases":[16],"a":[17,100,126],"Python":[18,56,61],"notebook":[19,42,57],"reproducing":[20],"quantitative<br>":[22],"figures":[23],"featured":[24],"in":[25,90,142],"research":[27],"article":[28],"\"Mastering":[29],"<br>":[35,54],"Learning\".":[39],"<strong>Usage</strong>":[40],"The":[41,55],"can":[43],"be":[44],"uploaded":[45],"to":[46,141],"and":[47,64,184],"executed":[48],"using":[49],"the<br>":[50],"[Colab](https://colab.research.google.com)":[51],"runtime":[52],"service.":[53],"is":[58,73,190],"tested":[59],"against":[60],"`3.7`.":[62],"<strong>License":[63],"disclaimer</strong>":[65],"Copyright":[66],"2022":[67],"DeepMind":[68],"Technologies":[69],"Limited":[70],"All":[71,109],"software":[72,145],"licensed":[74,113],"under":[75,114,150,186],"Apache":[77,94,104,152],"License,":[78],"Version":[79],"2.0":[80,95,105,153],"(Apache":[81],"2.0);":[82],"you<br>":[83],"may":[84,124],"not":[85,191],"use":[86],"this":[87],"file":[88],"except":[89],"compliance":[91],"license.":[96],"You":[97,123],"may<br>":[98],"obtain":[99,125],"copy":[101,127],"license":[106,131],"at:<br>":[107,132],"https://www.apache.org/licenses/LICENSE-2.0":[108],"other":[110],"materials":[111,147],"are":[112],"Creative":[116],"Commons":[117],"Attribution":[118],"4.0<br>":[119],"International":[120],"License":[121],"(CC-BY).":[122],"CC-BY":[130,155],"https://creativecommons.org/licenses/by/4.0/legalcode":[133],"Unless":[134],"required":[135],"by":[136],"applicable":[137],"law":[138],"or":[139,154,173],"agreed":[140],"writing,":[143],"all":[144],"and<br>":[146],"distributed":[148,158],"here":[149],"licenses":[156,177],"are<br>":[157],"on":[159],"an":[160,192],"\"AS":[161],"IS\"":[162],"BASIS,":[163],"WITHOUT":[164],"WARRANTIES":[165],"OR":[166],"CONDITIONS":[167],"OF":[168],"ANY":[169],"KIND,<br>":[170],"either":[171],"express":[172],"implied.":[174],"See":[175],"specific":[180],"language":[181],"governing<br>":[182],"permissions":[183],"limitations":[185],"those":[187],"licenses.":[188],"official":[193],"Google":[194],"product.":[195]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
