{"id":"https://openalex.org/W4412106618","doi":"https://doi.org/10.1145/3712256.3726335","title":"Scaling Policy Gradient Quality-Diversity with Massive Parallelization via Behavioral Variations","display_name":"Scaling Policy Gradient Quality-Diversity with Massive Parallelization via Behavioral Variations","publication_year":2025,"publication_date":"2025-07-08","ids":{"openalex":"https://openalex.org/W4412106618","doi":"https://doi.org/10.1145/3712256.3726335"},"language":"en","primary_location":{"id":"doi:10.1145/3712256.3726335","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712256.3726335","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1145/3712256.3726335","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116129717","display_name":"Konstantinos Mitsides","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Konstantinos Mitsides","raw_affiliation_strings":["Imperial College London, London, United Kingdom"],"raw_orcid":"https://orcid.org/0009-0007-1363-9777","affiliations":[{"raw_affiliation_string":"Imperial College London, London, United Kingdom","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082433472","display_name":"Maxence Faldor","orcid":"https://orcid.org/0000-0003-4743-9494"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Maxence Faldor","raw_affiliation_strings":["Imperial College London, London, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0003-4743-9494","affiliations":[{"raw_affiliation_string":"Imperial College London, London, United Kingdom","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011747084","display_name":"Antoine Cully","orcid":"https://orcid.org/0000-0002-3190-7073"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Antoine Cully","raw_affiliation_strings":["Imperial College London, London, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-3190-7073","affiliations":[{"raw_affiliation_string":"Imperial College London, London, United Kingdom","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6376,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.67948718,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1282","last_page":"1290"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.7503834366798401},{"id":"https://openalex.org/keywords/diversity","display_name":"Diversity (politics)","score":0.6723113059997559},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5865466594696045},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5143080949783325},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.37547367811203003},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11962509155273438},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.10255280137062073},{"id":"https://openalex.org/keywords/epistemology","display_name":"Epistemology","score":0.07685324549674988}],"concepts":[{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.7503834366798401},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.6723113059997559},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5865466594696045},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5143080949783325},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.37547367811203003},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11962509155273438},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.10255280137062073},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.07685324549674988},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3712256.3726335","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712256.3726335","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3712256.3726335","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712256.3726335","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W102487131","https://openalex.org/W1738827650","https://openalex.org/W2119717200","https://openalex.org/W2145339207","https://openalex.org/W2462548332","https://openalex.org/W2492794003","https://openalex.org/W2620641794","https://openalex.org/W2963776872","https://openalex.org/W3004042307","https://openalex.org/W3009830825","https://openalex.org/W3018036994","https://openalex.org/W3112009288","https://openalex.org/W3129322645","https://openalex.org/W4365800092","https://openalex.org/W4384024810","https://openalex.org/W4386523338"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Quality-Diversity":[0],"optimization":[1],"comprises":[2],"a":[3,11,20,103,163,178],"family":[4],"of":[5,13,34,110,166],"evolutionary":[6,29],"algorithms":[7,191],"aimed":[8],"at":[9,67],"generating":[10],"collection":[12,165],"diverse":[14,164],"and":[15,147],"high-performing":[16,167],"solutions.":[17,48],"MAP-Elites":[18],"(ME),":[19],"notable":[21],"example,":[22],"is":[23],"used":[24],"effectively":[25],"in":[26,82,172],"fields":[27],"like":[28,58],"robotics.":[30],"However,":[31],"the":[32],"reliance":[33,93],"ME":[35,69,106],"on":[36,94,133,142,177,184],"random":[37],"mutations":[38],"from":[39,76],"Genetic":[40],"Algorithms":[41],"limits":[42],"its":[43],"ability":[44],"to":[45,51,88,151],"evolve":[46],"high-dimensional":[47],"Methods":[49],"proposed":[50],"overcome":[52],"this":[53,99],"include":[54],"using":[55,153],"gradient-based":[56],"operators":[57],"policy":[59,126,154],"gradients":[60],"or":[61,80,92],"natural":[62],"evolution":[63],"strategies.":[64],"While":[65],"successful":[66],"scaling":[68,83,111],"for":[70],"neuroevolution,":[71],"these":[72,149],"methods":[73],"often":[74],"suffer":[75],"slow":[77],"training":[78],"speeds,":[79],"difficulties":[81],"with":[84,112],"massive":[85,113],"parallelization":[86],"due":[87],"high":[89],"computational":[90],"demands":[91],"centralized":[95,134],"actor-critic":[96,135],"training.":[97,136],"In":[98],"work,":[100],"we":[101],"introduce":[102],"fast,":[104],"sample-efficient":[105],"based":[107,141],"algorithm":[108],"capable":[109],"parallelization,":[114],"significantly":[115],"reducing":[116],"runtimes":[117],"without":[118],"compromising":[119],"performance.":[120],"Our":[121,156],"method,":[122],"ASCII-ME,":[123],"unlike":[124],"existing":[125],"gradient":[127],"quality-diversity":[128],"methods,":[129],"does":[130],"not":[131],"rely":[132],"It":[137],"performs":[138],"behavioral":[139],"variations":[140,150],"time":[143],"step":[144],"performance":[145],"metrics":[146],"maps":[148],"solutions":[152],"gradients.":[155],"experiments":[157],"show":[158],"that":[159],"ASCII-ME":[160],"can":[161],"generate":[162],"deep":[168],"neural":[169],"network":[170],"policies":[171],"less":[173],"than":[174,189],"250":[175],"seconds":[176],"single":[179],"GPU.":[180],"Additionally,":[181],"it":[182],"operates":[183],"average,":[185],"five":[186],"times":[187],"faster":[188],"state-of-the-art":[190],"while":[192],"maintaining":[193],"competitive":[194],"sample":[195],"efficiency.":[196]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
