{"id":"https://openalex.org/W4381252681","doi":"https://doi.org/10.48550/arxiv.2306.09884","title":"Jumanji: a Diverse Suite of Scalable Reinforcement Learning Environments in JAX","display_name":"Jumanji: a Diverse Suite of Scalable Reinforcement Learning Environments in JAX","publication_year":2023,"publication_date":"2023-06-16","ids":{"openalex":"https://openalex.org/W4381252681","doi":"https://doi.org/10.48550/arxiv.2306.09884"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2306.09884","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.09884","pdf_url":"https://arxiv.org/pdf/2306.09884","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2306.09884","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104096516","display_name":"Cl\u00e9ment Bonnet","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bonnet, Cl\u00e9ment","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100400376","display_name":"Xiapu Luo","orcid":"https://orcid.org/0000-0002-9082-3208"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111129786","display_name":"Donal Byrne","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Byrne, Donal","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034039171","display_name":"Shikha Surana","orcid":"https://orcid.org/0009-0007-1701-6876"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Surana, Shikha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092207525","display_name":"Vincent Coyette","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abramowitz, Sasha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066670209","display_name":"Paul A. Duckworth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Duckworth, Paul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047239079","display_name":"Laurence I. Midgley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Coyette, Vincent","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051822398","display_name":"Tristan Kalloniatis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Midgley, Laurence I.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036841115","display_name":"Sasha Abramowitz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tegegn, Elshadai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112940692","display_name":"Cemlyn N. Waters","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kalloniatis, Tristan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082924676","display_name":"Andries P. Smit","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mahjoub, Omayma","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032092481","display_name":"Nathan Grinsztajn","orcid":"https://orcid.org/0000-0001-6817-5972"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Macfarlane, Matthew","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019820911","display_name":"Ulrich A. Mbou Sob","orcid":"https://orcid.org/0000-0001-9710-9368"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Smit, Andries P.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016637916","display_name":"Omayma Mahjoub","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Grinsztajn, Nathan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092207523","display_name":"Elshadai Tegegn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boige, Raphael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092207524","display_name":"Mohamed A. Mimouni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Waters, Cemlyn N.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012539791","display_name":"Raphael Boige","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mimouni, Mohamed A.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037797948","display_name":"Ruan de Kock","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sob, Ulrich A. Mbou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023452296","display_name":"Daniel Furelos-Blanco","orcid":"https://orcid.org/0000-0001-7461-1910"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Kock, Ruan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102525201","display_name":"Victor Le","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Siddarth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017043594","display_name":"Arnu Pretorius","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Furelos-Blanco, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069279442","display_name":"Alexandre Laterre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Le, Victor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Pretorius, Arnu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pretorius, Arnu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Laterre, Alexandre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Laterre, Alexandre","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":24,"corresponding_author_ids":["https://openalex.org/A5104096516"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9336000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11675","display_name":"Open Source Software Innovations","score":0.9257000088691711,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.897598385810852},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8430824279785156},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.8382655382156372},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8080016374588013},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.7222879528999329},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.5789508819580078},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5641748905181885},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5149403214454651},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5043014287948608},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5036007761955261},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.37196123600006104},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.334482878446579},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.32321569323539734},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29351601004600525},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.17953899502754211},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1264028251171112},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.07054257392883301}],"concepts":[{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.897598385810852},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8430824279785156},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.8382655382156372},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8080016374588013},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.7222879528999329},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.5789508819580078},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5641748905181885},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5149403214454651},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5043014287948608},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5036007761955261},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.37196123600006104},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.334482878446579},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32321569323539734},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29351601004600525},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17953899502754211},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1264028251171112},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.07054257392883301},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2306.09884","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.09884","pdf_url":"https://arxiv.org/pdf/2306.09884","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2306.09884","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2306.09884","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2306.09884","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.09884","pdf_url":"https://arxiv.org/pdf/2306.09884","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.6100000143051147,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4381252681.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2357124094","https://openalex.org/W2387399993","https://openalex.org/W2389739210","https://openalex.org/W2348924972","https://openalex.org/W2365736347","https://openalex.org/W2047454415","https://openalex.org/W2070040999","https://openalex.org/W2387293848","https://openalex.org/W2250140200","https://openalex.org/W3088304681"],"abstract_inverted_index":{"Open-source":[0],"reinforcement":[1],"learning":[2],"(RL)":[3],"environments":[4,29,57,71],"have":[5],"played":[6],"a":[7,25,41,52,68,159],"crucial":[8],"role":[9],"in":[10,13,40,78],"driving":[11],"progress":[12],"the":[14,89,128],"development":[15],"of":[16,44,54,70,91,104,167],"AI":[17],"algorithms.":[18],"In":[19],"modern":[20],"RL":[21,56,117,168],"research,":[22],"there":[23],"is":[24,121],"need":[26],"for":[27,143,162],"simulated":[28],"that":[30],"are":[31],"performant,":[32],"scalable,":[33],"and":[34,64,93,98,107,132,152,165],"modular":[35],"to":[36,60,126,135,157],"enable":[37],"their":[38,136],"utilization":[39],"wider":[42],"range":[43],"potential":[45],"real-world":[46],"applications.":[47],"Therefore,":[48],"we":[49,139],"present":[50],"Jumanji,":[51],"suite":[53,69],"diverse":[55],"specifically":[58],"designed":[59],"be":[61],"fast,":[62],"flexible,":[63],"scalable.":[65],"Jumanji":[66,100,120,155],"provides":[67],"focusing":[72],"on":[73,150],"combinatorial":[74],"problems":[75],"frequently":[76],"encountered":[77],"industry,":[79],"as":[80,82],"well":[81],"challenging":[83],"general":[84],"decision-making":[85],"tasks.":[86],"By":[87],"leveraging":[88],"efficiency":[90],"JAX":[92],"hardware":[94],"accelerators":[95],"like":[96],"GPUs":[97],"TPUs,":[99],"enables":[101],"rapid":[102],"iteration":[103],"research":[105],"ideas":[106],"large-scale":[108],"experimentation,":[109],"ultimately":[110],"empowering":[111],"more":[112],"capable":[113],"agents.":[114],"Unlike":[115],"existing":[116],"environment":[118],"suites,":[119],"highly":[122],"customizable,":[123],"allowing":[124],"users":[125],"tailor":[127],"initial":[129],"state":[130],"distribution":[131],"problem":[133],"complexity":[134],"needs.":[137],"Furthermore,":[138],"provide":[140],"actor-critic":[141],"baselines":[142],"each":[144],"environment,":[145],"accompanied":[146],"by":[147],"preliminary":[148],"findings":[149],"scaling":[151],"generalization":[153],"scenarios.":[154],"aims":[156],"set":[158],"new":[160],"standard":[161],"speed,":[163],"adaptability,":[164],"scalability":[166],"environments.":[169]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
