{"id":"https://openalex.org/W3006079285","doi":"https://doi.org/10.1145/3377930.3389842","title":"Effective reinforcement learning through evolutionary surrogate-assisted prescription","display_name":"Effective reinforcement learning through evolutionary surrogate-assisted prescription","publication_year":2020,"publication_date":"2020-06-25","ids":{"openalex":"https://openalex.org/W3006079285","doi":"https://doi.org/10.1145/3377930.3389842","mag":"3006079285"},"language":"en","primary_location":{"id":"doi:10.1145/3377930.3389842","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3377930.3389842","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2002.05368","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002978952","display_name":"Olivier Francon","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Olivier Francon","raw_affiliation_strings":["The University of Texas at Austin","the University of Texas at, Austin"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"the University of Texas at, Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066709653","display_name":"Santiago Gonz\u00e1lez","orcid":"https://orcid.org/0000-0001-5685-4580"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Santiago Gonzalez","raw_affiliation_strings":["The University of Texas at Austin","the University of Texas at, Austin"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"the University of Texas at, Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035553462","display_name":"Babak Hodjat","orcid":"https://orcid.org/0000-0002-4547-4731"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Babak Hodjat","raw_affiliation_strings":["The University of Texas at Austin","the University of Texas at, Austin"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"the University of Texas at, Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020821744","display_name":"Elliot Meyerson","orcid":"https://orcid.org/0000-0002-1871-2757"},"institutions":[{"id":"https://openalex.org/I1321014770","display_name":"Association for Computing Machinery","ror":"https://ror.org/03wsadn68","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1321014770"]},{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Elliot Meyerson","raw_affiliation_strings":["The University of Texas at Austin","Association for Computing Machinery"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"Association for Computing Machinery","institution_ids":["https://openalex.org/I1321014770"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020441009","display_name":"Risto Miikkulainen","orcid":"https://orcid.org/0000-0002-0062-0037"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Risto Miikkulainen","raw_affiliation_strings":["The University of Texas at Austin","the University of Texas at, Austin"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"the University of Texas at, Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102019018","display_name":"Xin Qiu","orcid":"https://orcid.org/0000-0001-5358-8854"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Qiu","raw_affiliation_strings":["The University of Texas at Austin","the University of Texas at, Austin"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"the University of Texas at, Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034397027","display_name":"Hormoz Shahrzad","orcid":"https://orcid.org/0000-0002-5983-4531"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hormoz Shahrzad","raw_affiliation_strings":["The University of Texas at Austin","the University of Texas at, Austin"],"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"the University of Texas at, Austin","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5002978952"],"corresponding_institution_ids":["https://openalex.org/I86519309"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.0429989,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"814","last_page":"822"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7939821481704712},{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.7423350811004639},{"id":"https://openalex.org/keywords/surrogate-model","display_name":"Surrogate model","score":0.7318651676177979},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6794294118881226},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6570408940315247},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5748111009597778},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5612255930900574},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4576515257358551},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.32407623529434204},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14039385318756104}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7939821481704712},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.7423350811004639},{"id":"https://openalex.org/C131675550","wikidata":"https://www.wikidata.org/wiki/Q7646884","display_name":"Surrogate model","level":2,"score":0.7318651676177979},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6794294118881226},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6570408940315247},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5748111009597778},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5612255930900574},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4576515257358551},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.32407623529434204},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14039385318756104},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/3377930.3389842","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3377930.3389842","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2002.05368","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.05368","pdf_url":"https://arxiv.org/pdf/2002.05368","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3006079285","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2002.05368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2002.05368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2002.05368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2002.05368","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.05368","pdf_url":"https://arxiv.org/pdf/2002.05368","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7099999785423279,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3006079285.pdf"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W75550020","https://openalex.org/W86586912","https://openalex.org/W166862392","https://openalex.org/W1522301498","https://openalex.org/W1568845561","https://openalex.org/W1966253115","https://openalex.org/W1987150989","https://openalex.org/W1987725948","https://openalex.org/W2011174137","https://openalex.org/W2013695155","https://openalex.org/W2023626239","https://openalex.org/W2074825805","https://openalex.org/W2074984119","https://openalex.org/W2091565802","https://openalex.org/W2111116266","https://openalex.org/W2113553269","https://openalex.org/W2123408238","https://openalex.org/W2125930537","https://openalex.org/W2131241448","https://openalex.org/W2138116946","https://openalex.org/W2144357723","https://openalex.org/W2145339207","https://openalex.org/W2156106639","https://openalex.org/W2173564293","https://openalex.org/W2174817438","https://openalex.org/W2257979135","https://openalex.org/W2530195778","https://openalex.org/W2547041763","https://openalex.org/W2588207035","https://openalex.org/W2596367596","https://openalex.org/W2726187156","https://openalex.org/W2736601468","https://openalex.org/W2739491397","https://openalex.org/W2778749116","https://openalex.org/W2792012198","https://openalex.org/W2807637204","https://openalex.org/W2890208753","https://openalex.org/W2891186800","https://openalex.org/W2906697496","https://openalex.org/W2909418179","https://openalex.org/W2950995823","https://openalex.org/W2957258712","https://openalex.org/W2962986780","https://openalex.org/W2964043796","https://openalex.org/W2964227899","https://openalex.org/W2990239702","https://openalex.org/W2995333506","https://openalex.org/W2998349125","https://openalex.org/W3011120880","https://openalex.org/W3020436856","https://openalex.org/W3037207827","https://openalex.org/W3089091950","https://openalex.org/W6677067356"],"related_works":["https://openalex.org/W3033575144","https://openalex.org/W2930108284","https://openalex.org/W2165119135","https://openalex.org/W2889012293","https://openalex.org/W762189110","https://openalex.org/W2019161915","https://openalex.org/W1965819279","https://openalex.org/W2161551046","https://openalex.org/W3157235145","https://openalex.org/W3033218991","https://openalex.org/W3113335955","https://openalex.org/W2153303044","https://openalex.org/W112890221","https://openalex.org/W2587934155","https://openalex.org/W3127945807","https://openalex.org/W3117237870","https://openalex.org/W2122442339","https://openalex.org/W3165321979","https://openalex.org/W2883894333","https://openalex.org/W832602732"],"abstract_inverted_index":{"There":[0],"is":[1,31,82,87,98,132],"now":[2],"significant":[3],"historical":[4],"data":[5],"available":[6],"on":[7,128],"decision":[8,15,44,162,172],"making":[9,163],"in":[10,101,116,174],"organizations,":[11],"consisting":[12],"of":[13,93,124],"the":[14,24,48,80,91,94,114,122,129,154,157,161],"problem,":[16],"what":[17],"decisions":[18],"were":[19],"made,":[20],"and":[21,38,79,139,156],"how":[22],"desirable":[23],"outcomes":[25],"were.":[26],"Using":[27],"this":[28,102],"data,":[29],"it":[30,110],"possible":[32,111],"to":[33,89,104,112,171],"learn":[34],"a":[35,43,53,68,72,83,168],"surrogate":[36,64,95,155],"model,":[37,41],"with":[39,76],"that":[40,46,86],"evolve":[42],"strategy":[45,81,158],"optimizes":[47],"outcomes.":[49],"This":[50],"paper":[51,103],"introduces":[52],"general":[54],"such":[55],"approach,":[56],"called":[57],"Evolutionary":[58],"Surrogate-Assisted":[59],"Prescription,":[60],"or":[61,71],"ESP.":[62],"The":[63],"is,":[65],"for":[66],"example,":[67],"random":[69],"forest":[70],"neural":[73,84],"network":[74,85,159],"trained":[75],"gradient":[77],"descent,":[78],"evolved":[88],"maximize":[90],"predictions":[92],"model.":[96],"ESP":[97,131,165],"further":[99],"extended":[100],"sequential":[105],"decision-making":[106],"tasks,":[107],"which":[108],"makes":[109],"evaluate":[113],"framework":[115],"reinforcement":[117],"learning":[118],"(RL)":[119],"benchmarks.":[120],"Because":[121],"majority":[123],"evaluations":[125],"are":[126,149],"done":[127],"surrogate,":[130],"more":[133],"sample":[134],"efficient,":[135],"has":[136],"lower":[137,140],"variance,":[138],"regret":[141],"than":[142],"standard":[143],"RL":[144],"approaches.":[145],"Surprisingly,":[146],"its":[147],"solutions":[148],"also":[150],"better":[151],"because":[152],"both":[153],"regularize":[160],"behavior.":[164],"thus":[166],"forms":[167],"promising":[169],"foundation":[170],"optimization":[173],"real-world":[175],"problems.":[176]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
