{"id":"https://openalex.org/W4310113594","doi":"https://doi.org/10.1145/3568562.3568579","title":"Benchmarking Gradient Estimation Mechanisms in Evolution Strategies for Solving Black-Box Optimization Functions and Reinforcement Learning Problems","display_name":"Benchmarking Gradient Estimation Mechanisms in Evolution Strategies for Solving Black-Box Optimization Functions and Reinforcement Learning Problems","publication_year":2022,"publication_date":"2022-11-29","ids":{"openalex":"https://openalex.org/W4310113594","doi":"https://doi.org/10.1145/3568562.3568579"},"language":"en","primary_location":{"id":"doi:10.1145/3568562.3568579","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3568562.3568579","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 11th International Symposium on Information and Communication Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054013911","display_name":"Thai Bao Tran","orcid":"https://orcid.org/0000-0002-5876-4092"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Thai Bao Tran","raw_affiliation_strings":["University of Information Technology, Viet Nam and Vietnam National University Ho Chi Minh City, Vietnam"],"raw_orcid":"https://orcid.org/0000-0002-5876-4092","affiliations":[{"raw_affiliation_string":"University of Information Technology, Viet Nam and Vietnam National University Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081219326","display_name":"Ngoc Hoang Luong","orcid":"https://orcid.org/0000-0002-6768-1950"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Ngoc Hoang Luong","raw_affiliation_strings":["University of Information Technology, Viet Nam and Vietnam National University Ho Chi Minh City, Vietnam"],"raw_orcid":"https://orcid.org/0000-0002-6768-1950","affiliations":[{"raw_affiliation_string":"University of Information Technology, Viet Nam and Vietnam National University Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5054013911"],"corresponding_institution_ids":["https://openalex.org/I123565023"],"apc_list":null,"apc_paid":null,"fwci":0.1387,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.5618197,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"39","last_page":"46"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7057561278343201},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6172826290130615},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6009026169776917},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5224986672401428},{"id":"https://openalex.org/keywords/cma-es","display_name":"CMA-ES","score":0.48132288455963135},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.45311886072158813},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42187952995300293},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3994585871696472},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.36108970642089844},{"id":"https://openalex.org/keywords/evolutionary-computation","display_name":"Evolutionary computation","score":0.3533323109149933},{"id":"https://openalex.org/keywords/evolution-strategy","display_name":"Evolution strategy","score":0.3333275318145752},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.25074756145477295}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7057561278343201},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6172826290130615},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6009026169776917},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5224986672401428},{"id":"https://openalex.org/C205555498","wikidata":"https://www.wikidata.org/wiki/Q505588","display_name":"CMA-ES","level":4,"score":0.48132288455963135},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.45311886072158813},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42187952995300293},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3994585871696472},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.36108970642089844},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.3533323109149933},{"id":"https://openalex.org/C207002847","wikidata":"https://www.wikidata.org/wiki/Q2912857","display_name":"Evolution strategy","level":3,"score":0.3333275318145752},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.25074756145477295},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3568562.3568579","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3568562.3568579","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 11th International Symposium on Information and Communication Technology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W1506498113","https://openalex.org/W2112036188","https://openalex.org/W2149479912","https://openalex.org/W2963345217","https://openalex.org/W4211214963"],"related_works":["https://openalex.org/W1579744901","https://openalex.org/W1492325323","https://openalex.org/W2510724351","https://openalex.org/W3087341323","https://openalex.org/W2465356436","https://openalex.org/W2552260697","https://openalex.org/W2592891920","https://openalex.org/W2168924884","https://openalex.org/W2102869784","https://openalex.org/W2116954712"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"investigate":[4],"the":[5,15,19,25,46,54,78,121,128],"gradient":[6,56,87],"estimation":[7],"mechanisms":[8],"of":[9,53,103,124],"three":[10],"evolution":[11],"strategies":[12],"(ES)":[13],"algorithms:":[14],"vanilla":[16,31],"ES":[17,32],"(VES),":[18],"Guided":[20],"Evolutionary":[21],"Strategies":[22,28],"(GES),":[23],"and":[24,67,111,127],"Self-Guided":[26],"Evolution":[27],"(SGES).":[29],"The":[30],"generates":[33],"search":[34,83],"directions":[35,84],"(i.e.,":[36],"its":[37],"population":[38],"individuals)":[39],"following":[40],"an":[41],"isotropic":[42],"Gaussian":[43],"distribution":[44],"from":[45,60,81],"full":[47],"parameter":[48],"space,":[49],"yielding":[50],"unbiased":[51],"estimations":[52],"true":[55,79],"vectors":[57],"but":[58],"suffering":[59],"sample":[61],"inefficiency":[62],"in":[63,92,140],"high-dimensional":[64,104],"problems.":[65,144],"GES":[66],"SGES":[68],"aim":[69],"to":[70,133],"construct":[71],"low-dimensional":[72],"guiding":[73],"subspaces,":[74],"that":[75,131],"potentially":[76],"contain":[77],"gradients,":[80],"which":[82],"for":[85,136],"computing":[86],"estimates":[88],"can":[89],"be":[90,134],"generated":[91],"a":[93,101],"more":[94],"efficient":[95],"manner.":[96],"We":[97],"perform":[98],"experiments":[99],"with":[100],"variety":[102],"optimization":[105,143],"problems,":[106],"including":[107],"multi-modal":[108],"black-box":[109],"functions":[110],"noisy":[112],"reinforcement":[113],"learning":[114],"locomotion":[115],"tasks.":[116],"Experimental":[117],"results":[118],"help":[119],"pinpoint":[120],"essential":[122],"components":[123],"these":[125],"algorithms":[126],"important":[129],"issues":[130],"need":[132],"considered":[135],"their":[137],"successful":[138],"applications":[139],"solving":[141],"challenging":[142],"Source":[145],"code":[146],"is":[147],"available":[148],"at:":[149],"https://github.com/ELO-Lab/BenchGEM-ES.":[150]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
