{"id":"https://openalex.org/W4310173005","doi":"https://doi.org/10.1109/sbgames56371.2022.9961113","title":"DRLeague: a Novel 3D Environment for Training Reinforcement Learning Agents","display_name":"DRLeague: a Novel 3D Environment for Training Reinforcement Learning Agents","publication_year":2022,"publication_date":"2022-10-24","ids":{"openalex":"https://openalex.org/W4310173005","doi":"https://doi.org/10.1109/sbgames56371.2022.9961113"},"language":"en","primary_location":{"id":"doi:10.1109/sbgames56371.2022.9961113","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sbgames56371.2022.9961113","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 21st Brazilian Symposium on Computer Games and Digital Entertainment (SBGames)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070415192","display_name":"Hyuan P. Farrapo","orcid":null},"institutions":[{"id":"https://openalex.org/I243754102","display_name":"Universidade Federal do Cear\u00e1","ror":"https://ror.org/03srtnf24","country_code":"BR","type":"education","lineage":["https://openalex.org/I243754102"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Hyuan P. Farrapo","raw_affiliation_strings":["Virtual UFC Institute, Federal University of Ceara,Fortaleza,Brazil","Virtual UFC Institute, Federal University of Ceara, Fortaleza, Brazil"],"affiliations":[{"raw_affiliation_string":"Virtual UFC Institute, Federal University of Ceara,Fortaleza,Brazil","institution_ids":["https://openalex.org/I243754102"]},{"raw_affiliation_string":"Virtual UFC Institute, Federal University of Ceara, Fortaleza, Brazil","institution_ids":["https://openalex.org/I243754102"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089205455","display_name":"Romulo F. F\u00e9rrer Filho","orcid":"https://orcid.org/0000-0001-5084-4867"},"institutions":[{"id":"https://openalex.org/I243754102","display_name":"Universidade Federal do Cear\u00e1","ror":"https://ror.org/03srtnf24","country_code":"BR","type":"education","lineage":["https://openalex.org/I243754102"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Romulo F. F. Filho","raw_affiliation_strings":["Federal University of Cear&#x00E1;,Department of Computing,Fortaleza,Brazil"],"affiliations":[{"raw_affiliation_string":"Federal University of Cear&#x00E1;,Department of Computing,Fortaleza,Brazil","institution_ids":["https://openalex.org/I243754102"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021788425","display_name":"Jos\u00e9 Gilvan Rodrigues Maia","orcid":"https://orcid.org/0000-0002-2607-2729"},"institutions":[{"id":"https://openalex.org/I243754102","display_name":"Universidade Federal do Cear\u00e1","ror":"https://ror.org/03srtnf24","country_code":"BR","type":"education","lineage":["https://openalex.org/I243754102"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Jose G. R. Maia","raw_affiliation_strings":["Virtual UFC Institute, Federal University of Cear&#x00E1;,Fortaleza,Brazil"],"affiliations":[{"raw_affiliation_string":"Virtual UFC Institute, Federal University of Cear&#x00E1;,Fortaleza,Brazil","institution_ids":["https://openalex.org/I243754102"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030350071","display_name":"Paulo Bruno S. Serafim","orcid":"https://orcid.org/0000-0002-5980-8149"},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I4210106545","display_name":"Centre Inria d'Universit\u00e9 C\u00f4te d'Azur","ror":"https://ror.org/01nzkaw91","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I201841394","https://openalex.org/I4210106545"]},{"id":"https://openalex.org/I4210150884","display_name":"Fondation Sophia Antipolis","ror":"https://ror.org/05nkcfv27","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210150884"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Paulo B. S. Serafim","raw_affiliation_strings":["COATI, Inria Sophia Antipolis,Sophia Antipolis,France","COATI, Inria Sophia Antipolis, Sophia Antipolis, France"],"affiliations":[{"raw_affiliation_string":"COATI, Inria Sophia Antipolis,Sophia Antipolis,France","institution_ids":["https://openalex.org/I4210150884","https://openalex.org/I4210106545","https://openalex.org/I1326498283"]},{"raw_affiliation_string":"COATI, Inria Sophia Antipolis, Sophia Antipolis, France","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5070415192"],"corresponding_institution_ids":["https://openalex.org/I243754102"],"apc_list":null,"apc_paid":null,"fwci":0.1379,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.55885533,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9810000061988831,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9763000011444092,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7092170119285583},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6680361032485962},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6265743374824524},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4259776175022125},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3622061610221863},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.04831400513648987}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7092170119285583},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6680361032485962},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6265743374824524},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4259776175022125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3622061610221863},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.04831400513648987},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/sbgames56371.2022.9961113","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sbgames56371.2022.9961113","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 21st Brazilian Symposium on Computer Games and Digital Entertainment (SBGames)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2150468603","https://openalex.org/W2736601468","https://openalex.org/W2749807327","https://openalex.org/W2889987506","https://openalex.org/W2890827732","https://openalex.org/W2941355526","https://openalex.org/W2963871073","https://openalex.org/W2996037775","https://openalex.org/W2997502221","https://openalex.org/W3011120880","https://openalex.org/W3157911183","https://openalex.org/W4298857966","https://openalex.org/W4309432140","https://openalex.org/W6637967152","https://openalex.org/W6741002519","https://openalex.org/W6743756900","https://openalex.org/W6753526802","https://openalex.org/W6754583135","https://openalex.org/W6780559895"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W230091440","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2233261550","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2810751659","https://openalex.org/W258997015"],"abstract_inverted_index":{"The":[0],"development":[1],"of":[2,31,55,145,166,181],"autonomous":[3],"agents":[4,167],"performing":[5],"unique":[6],"interactions":[7],"that":[8,33],"resemble":[9],"human-like":[10],"behavior":[11],"is":[12,34],"currently":[13],"driven":[14],"by":[15,36,102],"Deep":[16],"Reinforcement":[17],"Learning":[18],"(DRL)":[19],"techniques":[20],"combined":[21],"with":[22,126],"complex":[23,66,149],"virtual":[24],"environments.":[25],"These":[26],"constitute":[27],"an":[28],"active":[29],"field":[30],"research":[32],"fueled":[35],"environments":[37],"usually":[38],"inspired":[39,101],"or":[40],"borrowed":[41],"from":[42,123],"video":[43],"games.":[44],"Although":[45],"works":[46],"in":[47,178],"the":[48,103,111,121,152,163,179],"area":[49],"commonly":[50],"do":[51],"not":[52],"make":[53],"use":[54],"trending":[56],"3D":[57,99],"games,":[58],"these":[59,146],"games":[60,100],"are":[61],"interesting":[62],"testbeds":[63],"for":[64,98],"more":[65,75,148],"and":[67,92,130,141],"compelling":[68],"behaviors,":[69],"as":[70,174],"they":[71],"tend":[72],"to":[73,89],"explore":[74],"variables":[76],"than":[77,151],"their":[78],"predecessors.":[79],"This":[80],"paper":[81],"introduces":[82],"DRLeague,":[83],"a":[84,175],"novel":[85],"DRL":[86],"environment,":[87],"proposed":[88],"be":[90],"open-source,":[91],"easily":[93],"customizable,":[94],"which":[95],"supports":[96],"mechanics":[97,122],"popular":[104],"\u201ccar":[105],"football\u201d":[106],"game":[107],"Rocket":[108],"League.":[109],"Besides":[110],"typical":[112],"gameplay,":[113],"we":[114,156],"implemented":[115],"four":[116],"challenging":[117],"minigames":[118],"based":[119],"on":[120],"this":[124],"title":[125],"advanced":[127],"physics":[128],"simulation":[129],"fine-grained":[131],"car":[132],"control:":[133],"penalty":[134,137],"shoot,":[135,138,143],"multiplayer":[136],"barrier":[139],"kick,":[140],"aerial":[142],"each":[144],"requiring":[147],"skills":[150],"previous":[153],"ones.":[154],"Finally,":[155],"provide":[157],"solid":[158],"baseline":[159],"experimental":[160],"results":[161],"showing":[162],"learning":[164,183],"progress":[165],"using":[168],"Unity's":[169],"ML-Agents":[170],"toolkit,":[171],"evidencing":[172],"DRLeague":[173],"suitable":[176],"testbed":[177],"application":[180],"machine":[182],"techniques.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
