{"id":"https://openalex.org/W7131812903","doi":"https://doi.org/10.1016/j.simpa.2026.100829","title":"Gym-TORAX: Open-source software for integrating reinforcement learning with plasma control simulators in tokamak research","display_name":"Gym-TORAX: Open-source software for integrating reinforcement learning with plasma control simulators in tokamak research","publication_year":2026,"publication_date":"2026-02-27","ids":{"openalex":"https://openalex.org/W7131812903","doi":"https://doi.org/10.1016/j.simpa.2026.100829"},"language":"en","primary_location":{"id":"doi:10.1016/j.simpa.2026.100829","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.simpa.2026.100829","pdf_url":null,"source":{"id":"https://openalex.org/S4210180398","display_name":"Software Impacts","issn_l":"2665-9638","issn":["2665-9638"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software Impacts","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1016/j.simpa.2026.100829","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119307055","display_name":"Antoine Mouchamps","orcid":null},"institutions":[{"id":"https://openalex.org/I157674565","display_name":"University of Li\u00e8ge","ror":"https://ror.org/00afp2z80","country_code":"BE","type":"education","lineage":["https://openalex.org/I157674565"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Antoine Mouchamps","raw_affiliation_strings":["Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium"],"affiliations":[{"raw_affiliation_string":"Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium","institution_ids":["https://openalex.org/I157674565"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115624520","display_name":"Arthur Malherbe","orcid":null},"institutions":[{"id":"https://openalex.org/I157674565","display_name":"University of Li\u00e8ge","ror":"https://ror.org/00afp2z80","country_code":"BE","type":"education","lineage":["https://openalex.org/I157674565"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Arthur Malherbe","raw_affiliation_strings":["Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium"],"affiliations":[{"raw_affiliation_string":"Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium","institution_ids":["https://openalex.org/I157674565"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075103449","display_name":"Adrien Bolland","orcid":null},"institutions":[{"id":"https://openalex.org/I157674565","display_name":"University of Li\u00e8ge","ror":"https://ror.org/00afp2z80","country_code":"BE","type":"education","lineage":["https://openalex.org/I157674565"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Adrien Bolland","raw_affiliation_strings":["Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium"],"affiliations":[{"raw_affiliation_string":"Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium","institution_ids":["https://openalex.org/I157674565"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077011518","display_name":"Damien Ernst","orcid":"https://orcid.org/0000-0002-3035-8260"},"institutions":[{"id":"https://openalex.org/I157674565","display_name":"University of Li\u00e8ge","ror":"https://ror.org/00afp2z80","country_code":"BE","type":"education","lineage":["https://openalex.org/I157674565"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Damien Ernst","raw_affiliation_strings":["Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium"],"affiliations":[{"raw_affiliation_string":"Montefiore Institute, University of Li\u00e8ge, Li\u00e8ge, Belgium","institution_ids":["https://openalex.org/I157674565"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5119307055"],"corresponding_institution_ids":["https://openalex.org/I157674565"],"apc_list":{"value":450,"currency":"USD","value_usd":450},"apc_paid":{"value":450,"currency":"USD","value_usd":450},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.57076708,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":null,"first_page":"100829","last_page":"100829"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10346","display_name":"Magnetic confinement fusion research","score":0.6590999960899353,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10346","display_name":"Magnetic confinement fusion research","score":0.6590999960899353,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.04699999839067459,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12007","display_name":"Plasma and Flow Control in Aerodynamics","score":0.018200000748038292,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7867000102996826},{"id":"https://openalex.org/keywords/tokamak","display_name":"Tokamak","score":0.7293999791145325},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.5950000286102295},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4345000088214874},{"id":"https://openalex.org/keywords/thermonuclear-fusion","display_name":"Thermonuclear fusion","score":0.40549999475479126},{"id":"https://openalex.org/keywords/plasma","display_name":"Plasma","score":0.3982999920845032}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7867000102996826},{"id":"https://openalex.org/C116515362","wikidata":"https://www.wikidata.org/wiki/Q188589","display_name":"Tokamak","level":3,"score":0.7293999791145325},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6428999900817871},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.5950000286102295},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4345000088214874},{"id":"https://openalex.org/C72260207","wikidata":"https://www.wikidata.org/wiki/Q7783221","display_name":"Thermonuclear fusion","level":3,"score":0.40549999475479126},{"id":"https://openalex.org/C82706917","wikidata":"https://www.wikidata.org/wiki/Q10251","display_name":"Plasma","level":2,"score":0.3982999920845032},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.39100000262260437},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3328000009059906},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.31439998745918274},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.3109999895095825},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.26930001378059387}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1016/j.simpa.2026.100829","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.simpa.2026.100829","pdf_url":null,"source":{"id":"https://openalex.org/S4210180398","display_name":"Software Impacts","issn_l":"2665-9638","issn":["2665-9638"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software Impacts","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2510.11283","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.11283","pdf_url":"https://arxiv.org/pdf/2510.11283","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:orbi.ulg.ac.be:2268/336745","is_oa":true,"landing_page_url":"https://orbi.uliege.be/handle/2268/336745","pdf_url":"https://orbi.uliege.be/bitstream/2268/336745/1/Gym-TORAX%20Open-source%20software%20for%20integrating%20RL%20with%20plasma%20control%20simulators.pdf","source":{"id":"https://openalex.org/S4306401300","display_name":"ORBi (University of Li\u00e8ge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I157674565","host_organization_name":"University of Li\u00e8ge","host_organization_lineage":["https://openalex.org/I157674565"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Software Impacts, 27, 100829 (2026-03-04)","raw_type":"peer reviewed"}],"best_oa_location":{"id":"doi:10.1016/j.simpa.2026.100829","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.simpa.2026.100829","pdf_url":null,"source":{"id":"https://openalex.org/S4210180398","display_name":"Software Impacts","issn_l":"2665-9638","issn":["2665-9638"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software Impacts","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1977655452","https://openalex.org/W2003283650","https://openalex.org/W2033549247","https://openalex.org/W2081965316","https://openalex.org/W3102560187","https://openalex.org/W3137465606","https://openalex.org/W3160501851","https://openalex.org/W3179456407","https://openalex.org/W4211151981","https://openalex.org/W4213377513","https://openalex.org/W4247314385","https://openalex.org/W4392015292"],"related_works":[],"abstract_inverted_index":{"This":[0,59],"paper":[1],"presents":[2],"Gym-TORAX,":[3],"a":[4,20,27,31],"Python":[5],"package":[6],"to":[7,52,71],"define":[8],"Reinforcement":[9,96,104],"Learning":[10],"(RL)":[11],"environments":[12],"for":[13,101,106,113],"plasma":[14,36,41,46,60,108,115],"control":[15,61],"in":[16,99],"tokamaks.":[17],"Gym-TORAX":[18],"instantiates":[19],"Gymnasium":[21,100],"environment":[22,39,82,98],"from":[23],"an":[24,88],"action":[25],"space,":[26,29],"state-observation":[28],"and":[30,48,69,75],"reward":[32],"function":[33],"that":[34],"measures":[35],"characteristics.":[37],"The":[38],"computes":[40],"states":[42],"using":[43],"the":[44,49,54],"TORAX":[45,111],"simulator":[47],"objective":[50],"is":[51,63,83],"maximize":[53],"expected":[55],"sum":[56],"of":[57],"rewards.":[58],"formalization":[62],"compatible":[64],"with":[65],"most":[66],"RL":[67,73],"algorithms":[68],"libraries":[70],"facilitate":[72],"research":[74],"applications.":[76],"In":[77],"its":[78],"current":[79],"version,":[80],"one":[81],"readily":[84],"available,":[85],"based":[86],"on":[87],"International":[89],"Thermonuclear":[90],"Experimental":[91],"Reactor":[92],"(ITER)":[93],"scenario.":[94],"\u2022":[95,103,110],"learning":[97,105],"cross-compatibility.":[102],"tokamak":[107],"control.":[109],"simulations":[112],"dynamic":[114],"modeling.":[116]},"counts_by_year":[],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-12-10T00:00:00"}
