{"id":"https://openalex.org/W4412106517","doi":"https://doi.org/10.1145/3712256.3726400","title":"MAPLE: Multi-Action Programs through Linear Evolution for Continuous Multi-Action Reinforcement Learning","display_name":"MAPLE: Multi-Action Programs through Linear Evolution for Continuous Multi-Action Reinforcement Learning","publication_year":2025,"publication_date":"2025-07-08","ids":{"openalex":"https://openalex.org/W4412106517","doi":"https://doi.org/10.1145/3712256.3726400"},"language":"en","primary_location":{"id":"doi:10.1145/3712256.3726400","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3712256.3726400","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-05196344v1/file/GECCO_2025_MAPLE_FINAL.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114768746","display_name":"Quentin Vacher","orcid":"https://orcid.org/0009-0001-9568-7196"},"institutions":[{"id":"https://openalex.org/I28221208","display_name":"Institut National des Sciences Appliqu\u00e9es de Rennes","ror":"https://ror.org/04xaa4j22","country_code":"FR","type":"education","lineage":["https://openalex.org/I28221208"]},{"id":"https://openalex.org/I4210100151","display_name":"Institut d'\u00c9lectronique et des Technologies du num\u00e9Rique","ror":"https://ror.org/013q33h79","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I28221208","https://openalex.org/I4210095849","https://openalex.org/I4210100151","https://openalex.org/I56067802","https://openalex.org/I97188460"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Quentin Vacher","raw_affiliation_strings":["Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France"],"raw_orcid":"https://orcid.org/0009-0001-9568-7196","affiliations":[{"raw_affiliation_string":"Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France","institution_ids":["https://openalex.org/I28221208","https://openalex.org/I4210100151"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101949050","display_name":"Stephen Kelly","orcid":"https://orcid.org/0000-0002-6071-4705"},"institutions":[{"id":"https://openalex.org/I98251732","display_name":"McMaster University","ror":"https://ror.org/02fa3aq29","country_code":"CA","type":"education","lineage":["https://openalex.org/I98251732"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Stephen Kelly","raw_affiliation_strings":["McMaster University, Hamilton, Canada","McMaster University [Hamilton, Ontario] (1280 Main Street West\r\nHamilton, Ontario L8S 4L8 - Canada)"],"raw_orcid":"https://orcid.org/0000-0002-6071-4705","affiliations":[{"raw_affiliation_string":"McMaster University, Hamilton, Canada","institution_ids":["https://openalex.org/I98251732"]},{"raw_affiliation_string":"McMaster University [Hamilton, Ontario] (1280 Main Street West\r\nHamilton, Ontario L8S 4L8 - Canada)","institution_ids":["https://openalex.org/I98251732"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ali Naqvi","orcid":"https://orcid.org/0009-0009-5735-4313"},"institutions":[{"id":"https://openalex.org/I98251732","display_name":"McMaster University","ror":"https://ror.org/02fa3aq29","country_code":"CA","type":"education","lineage":["https://openalex.org/I98251732"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ali Naqvi","raw_affiliation_strings":["McMaster University, Hamilton, Canada","McMaster University [Hamilton, Ontario] (1280 Main Street West\r\nHamilton, Ontario L8S 4L8 - Canada)"],"raw_orcid":"https://orcid.org/0009-0009-5735-4313","affiliations":[{"raw_affiliation_string":"McMaster University, Hamilton, Canada","institution_ids":["https://openalex.org/I98251732"]},{"raw_affiliation_string":"McMaster University [Hamilton, Ontario] (1280 Main Street West\r\nHamilton, Ontario L8S 4L8 - Canada)","institution_ids":["https://openalex.org/I98251732"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038179388","display_name":"Nicolas Beuve","orcid":"https://orcid.org/0000-0002-1371-4016"},"institutions":[{"id":"https://openalex.org/I28221208","display_name":"Institut National des Sciences Appliqu\u00e9es de Rennes","ror":"https://ror.org/04xaa4j22","country_code":"FR","type":"education","lineage":["https://openalex.org/I28221208"]},{"id":"https://openalex.org/I4210100151","display_name":"Institut d'\u00c9lectronique et des Technologies du num\u00e9Rique","ror":"https://ror.org/013q33h79","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I28221208","https://openalex.org/I4210095849","https://openalex.org/I4210100151","https://openalex.org/I56067802","https://openalex.org/I97188460"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Nicolas Beuve","raw_affiliation_strings":["Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France"],"raw_orcid":"https://orcid.org/0000-0002-1371-4016","affiliations":[{"raw_affiliation_string":"Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France","institution_ids":["https://openalex.org/I28221208","https://openalex.org/I4210100151"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114768720","display_name":"Tanya Djavaherpour","orcid":null},"institutions":[{"id":"https://openalex.org/I98251732","display_name":"McMaster University","ror":"https://ror.org/02fa3aq29","country_code":"CA","type":"education","lineage":["https://openalex.org/I98251732"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tanya Djavaherpour","raw_affiliation_strings":["McMaster University, Hamilton, Canada","McMaster University [Hamilton, Ontario] (1280 Main Street West\r\nHamilton, Ontario L8S 4L8 - Canada)"],"raw_orcid":"https://orcid.org/0009-0002-3585-1262","affiliations":[{"raw_affiliation_string":"McMaster University, Hamilton, Canada","institution_ids":["https://openalex.org/I98251732"]},{"raw_affiliation_string":"McMaster University [Hamilton, Ontario] (1280 Main Street West\r\nHamilton, Ontario L8S 4L8 - Canada)","institution_ids":["https://openalex.org/I98251732"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051748007","display_name":"Micka\u00ebl Dardaillon","orcid":"https://orcid.org/0000-0001-6862-2090"},"institutions":[{"id":"https://openalex.org/I28221208","display_name":"Institut National des Sciences Appliqu\u00e9es de Rennes","ror":"https://ror.org/04xaa4j22","country_code":"FR","type":"education","lineage":["https://openalex.org/I28221208"]},{"id":"https://openalex.org/I4210100151","display_name":"Institut d'\u00c9lectronique et des Technologies du num\u00e9Rique","ror":"https://ror.org/013q33h79","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I28221208","https://openalex.org/I4210095849","https://openalex.org/I4210100151","https://openalex.org/I56067802","https://openalex.org/I97188460"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Micka\u00ebl Dardaillon","raw_affiliation_strings":["Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France"],"raw_orcid":"https://orcid.org/0000-0001-6862-2090","affiliations":[{"raw_affiliation_string":"Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France","institution_ids":["https://openalex.org/I28221208","https://openalex.org/I4210100151"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075043317","display_name":"Karol Desnos","orcid":"https://orcid.org/0000-0003-1527-9668"},"institutions":[{"id":"https://openalex.org/I28221208","display_name":"Institut National des Sciences Appliqu\u00e9es de Rennes","ror":"https://ror.org/04xaa4j22","country_code":"FR","type":"education","lineage":["https://openalex.org/I28221208"]},{"id":"https://openalex.org/I4210100151","display_name":"Institut d'\u00c9lectronique et des Technologies du num\u00e9Rique","ror":"https://ror.org/013q33h79","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I28221208","https://openalex.org/I4210095849","https://openalex.org/I4210100151","https://openalex.org/I56067802","https://openalex.org/I97188460"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Karol Desnos","raw_affiliation_strings":["Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France"],"raw_orcid":"https://orcid.org/0000-0003-1527-9668","affiliations":[{"raw_affiliation_string":"Univ Rennes, INSA Rennes, CNRS, IETR, Rennes, France","institution_ids":["https://openalex.org/I28221208","https://openalex.org/I4210100151"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5114768746"],"corresponding_institution_ids":["https://openalex.org/I28221208","https://openalex.org/I4210100151"],"apc_list":null,"apc_paid":null,"fwci":2.1149,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.8854787,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1062","last_page":"1071"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9628000259399414,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/maple","display_name":"Maple","score":0.7814682722091675},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.7314215898513794},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6408818960189819},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.621143102645874},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4361686408519745},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.09273353219032288},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.0593583881855011},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.05820870399475098}],"concepts":[{"id":"https://openalex.org/C2780414537","wikidata":"https://www.wikidata.org/wiki/Q42292","display_name":"Maple","level":2,"score":0.7814682722091675},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.7314215898513794},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6408818960189819},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.621143102645874},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4361686408519745},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.09273353219032288},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0593583881855011},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.05820870399475098},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3712256.3726400","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3712256.3726400","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-05196344v1","is_oa":true,"landing_page_url":"https://hal.science/hal-05196344","pdf_url":"https://hal.science/hal-05196344v1/file/GECCO_2025_MAPLE_FINAL.pdf","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2025 Genetic and Evolutionary Computation Conference (GECCO 2025), Jul 2025, Malaga, Spain. pp.1062-1071, &#x27E8;10.1145/3712256.3726400&#x27E9;","raw_type":"Conference papers"},{"id":"pmh:oai:HAL:hal-05158323v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05158323","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"M\u00e1laga, Jul 2025, Malaga, Spain. pp.1062-1071, &#x27E8;10.1145/3712256.3726400&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-05196344v1","is_oa":true,"landing_page_url":"https://hal.science/hal-05196344","pdf_url":"https://hal.science/hal-05196344v1/file/GECCO_2025_MAPLE_FINAL.pdf","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2025 Genetic and Evolutionary Computation Conference (GECCO 2025), Jul 2025, Malaga, Spain. pp.1062-1071, &#x27E8;10.1145/3712256.3726400&#x27E9;","raw_type":"Conference papers"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G25908884","display_name":"Full-stack Optimization of Ultra-low-power TPGs for Intelligent Cyberphysical Systems","funder_award_id":"ANR-22-CE25-0005","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412106517.pdf","grobid_xml":"https://content.openalex.org/works/W4412106517.grobid-xml"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W18781575","https://openalex.org/W1593492645","https://openalex.org/W2061554433","https://openalex.org/W2122107405","https://openalex.org/W2150468603","https://openalex.org/W2969867445","https://openalex.org/W3100789280","https://openalex.org/W3116073702","https://openalex.org/W3177052905","https://openalex.org/W3192708540","https://openalex.org/W3207569066","https://openalex.org/W3216772467","https://openalex.org/W4214717370","https://openalex.org/W4226043654","https://openalex.org/W4232961138","https://openalex.org/W4237617116","https://openalex.org/W4247010906","https://openalex.org/W4285805590","https://openalex.org/W4365806381","https://openalex.org/W4386193536","https://openalex.org/W4388134984"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3008027610","https://openalex.org/W2619973341","https://openalex.org/W4300811723","https://openalex.org/W2210259036","https://openalex.org/W2019433297","https://openalex.org/W4399716563","https://openalex.org/W2970670716"],"abstract_inverted_index":{"Over":[0],"the":[1,4,28,45,105,125,159,173,182],"last":[2],"decades,":[3],"need":[5],"to":[6,143,168],"solve":[7],"complex":[8],"tasks":[9],"using":[10],"machine":[11],"learning":[12,18],"techniques":[13],"has":[14],"grown":[15],"significantly.":[16],"Deep":[17],"algorithms":[19,132],"achieve":[20],"state-of-the-art":[21,130],"performance":[22,142],"in":[23,78,83,103,149,191],"most":[24],"tasks,":[25,66],"but":[26],"at":[27],"cost":[29],"of":[30,110,172,184],"high":[31],"computational":[32],"complexity":[33],"and":[34,50,69,128,133,188],"limited":[35],"interpretability.":[36],"In":[37,52],"domains":[38],"such":[39],"as":[40,60],"Reinforcement":[41],"Learning":[42],"(RL),":[43],"understanding":[44],"agent":[46,106],"behavior":[47],"ensures":[48],"reliability":[49],"safety.":[51],"this":[53],"work,":[54],"we":[55,92],"explore":[56],"Genetic":[57,113],"Programming":[58],"(GP)":[59],"a":[61,100,108,134,144],"promising":[62],"solution":[63],"for":[64,118,177,186],"RL":[65,137,147],"providing":[67],"simpler":[68],"more":[70],"interpretable":[71,187],"solutions.":[72],"While":[73],"GP":[74,101,131],"achieves":[75,140],"competitive":[76],"results":[77],"low-complexity":[79],"environments,":[80],"it":[81,165],"struggles":[82],"environments":[84,151],"with":[85],"high-dimensional":[86],"action":[87,160],"spaces.":[88],"To":[89],"address":[90],"this,":[91],"propose":[93],"Multi-Action":[94],"Programs":[95,114],"through":[96],"Linear":[97,112],"Evolution":[98],"(MAPLE),":[99],"algorithm":[102],"which":[104,170],"is":[107,122,166],"team":[109],"multiple":[111],"(LGPs),":[115],"each":[116,178],"responsible":[117],"an":[119],"action.":[120,179],"MAPLE":[121,185],"evaluated":[123],"on":[124],"MuJoCo":[126],"suite":[127],"outperforms":[129],"small":[135],"deep":[136,146],"model.":[138],"It":[139],"comparable":[141],"larger":[145],"network":[148],"low-dimensional":[150],"while":[152],"maintaining":[153],"significantly":[154],"lower":[155],"complexity.":[156],"By":[157],"decomposing":[158],"decision":[161],"into":[162],"different":[163],"programs,":[164],"possible":[167],"understand":[169],"parts":[171],"states":[174],"are":[175],"needed":[176],"This":[180],"demonstrates":[181],"potential":[183],"efficient":[189],"solutions":[190],"RL.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":3}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
