{"id":"https://openalex.org/W3176111259","doi":"https://doi.org/10.1145/3449639.3459292","title":"Regularized evolutionary population-based training","display_name":"Regularized evolutionary population-based training","publication_year":2021,"publication_date":"2021-06-21","ids":{"openalex":"https://openalex.org/W3176111259","doi":"https://doi.org/10.1145/3449639.3459292","mag":"3176111259"},"language":"en","primary_location":{"id":"doi:10.1145/3449639.3459292","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3449639.3459292","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042555985","display_name":"Jason Liang","orcid":"https://orcid.org/0009-0007-9980-5077"},"institutions":[{"id":"https://openalex.org/I163361683","display_name":"Cognizant (United States)","ror":"https://ror.org/036s7bw54","country_code":"US","type":"company","lineage":["https://openalex.org/I163361683"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jason Liang","raw_affiliation_strings":["Cognizant AI Labs"],"affiliations":[{"raw_affiliation_string":"Cognizant AI Labs","institution_ids":["https://openalex.org/I163361683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066709653","display_name":"Santiago Gonz\u00e1lez","orcid":"https://orcid.org/0000-0001-5685-4580"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Santiago Gonzalez","raw_affiliation_strings":["The Univ. of Texas at Austin"],"affiliations":[{"raw_affiliation_string":"The Univ. of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034397027","display_name":"Hormoz Shahrzad","orcid":"https://orcid.org/0000-0002-5983-4531"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hormoz Shahrzad","raw_affiliation_strings":["The Univ. of Texas at Austin"],"affiliations":[{"raw_affiliation_string":"The Univ. of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020441009","display_name":"Risto Miikkulainen","orcid":"https://orcid.org/0000-0002-0062-0037"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Risto Miikkulainen","raw_affiliation_strings":["The Univ. of Texas at Austin"],"affiliations":[{"raw_affiliation_string":"The Univ. of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5042555985"],"corresponding_institution_ids":["https://openalex.org/I163361683"],"apc_list":null,"apc_paid":null,"fwci":1.1417,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.8138288,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"323","last_page":"331"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7361059188842773},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6701613068580627},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.6656464338302612},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6001290678977966},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5109378695487976},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.48390325903892517},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.42954131960868835},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.37149864435195923}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7361059188842773},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6701613068580627},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.6656464338302612},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6001290678977966},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5109378695487976},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.48390325903892517},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.42954131960868835},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.37149864435195923},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3449639.3459292","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3449639.3459292","pdf_url":null,"source":{"id":"https://openalex.org/S4363608932","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1499536210","https://openalex.org/W1569757501","https://openalex.org/W1677182931","https://openalex.org/W2101677491","https://openalex.org/W2145339207","https://openalex.org/W2154022540","https://openalex.org/W2335728318","https://openalex.org/W2593744649","https://openalex.org/W2794046125","https://openalex.org/W2889965839","https://openalex.org/W2906697496","https://openalex.org/W2947805651","https://openalex.org/W2950182411","https://openalex.org/W2963446712","https://openalex.org/W2963474950","https://openalex.org/W2964081807","https://openalex.org/W2965658867","https://openalex.org/W2992308087","https://openalex.org/W3100814079","https://openalex.org/W3118608800","https://openalex.org/W4212774754","https://openalex.org/W4246352495"],"related_works":["https://openalex.org/W4298369531","https://openalex.org/W3155135229","https://openalex.org/W2989932438","https://openalex.org/W4285827128","https://openalex.org/W3198113463","https://openalex.org/W4387297750","https://openalex.org/W2602382373","https://openalex.org/W2787698406","https://openalex.org/W2963844355","https://openalex.org/W2186333919"],"abstract_inverted_index":{"Metalearning":[0],"of":[1,15,33,38,87,94,112,182],"deep":[2],"neural":[3],"network":[4,21],"(DNN)":[5],"architectures":[6],"and":[7,114,120,143,163],"hyperparameters":[8,157],"has":[9,23,44],"become":[10],"an":[11,67,76],"increasingly":[12],"important":[13],"area":[14],"research.":[16],"At":[17],"the":[18,36,85,92,141,160,167,174],"same":[19],"time,":[20],"regularization":[22,43,183],"been":[24,47],"recognized":[25],"as":[26,66,130,132],"a":[27,88,124,179],"crucial":[28],"dimension":[29],"to":[30,70,135,159,165,173],"effective":[31,42],"training":[32,86,161],"DNNs.":[34],"However,":[35],"role":[37],"metalearning":[39,93,184],"in":[40,150],"establishing":[41],"not":[45],"yet":[46],"fully":[48],"explored.":[49],"There":[50],"is":[51,63],"recent":[52],"evidence":[53],"that":[54,83,104],"loss-function":[55],"optimization":[56],"could":[57],"play":[58],"this":[59],"role,":[60],"however":[61],"it":[62],"computationally":[64],"impractical":[65],"outer":[68],"loop":[69],"full":[71],"training.":[72,139,188],"This":[73],"paper":[74],"presents":[75],"algorithm":[77],"called":[78,127],"Evolutionary":[79],"Population-Based":[80],"Training":[81],"(EPBT)":[82],"interleaves":[84],"DNN's":[89],"weights":[90,113],"with":[91],"loss":[95,115],"functions.":[96],"They":[97],"are":[98],"parameterized":[99],"using":[100],"multivariate":[101],"Taylor":[102],"expansions":[103],"EPBT":[105,122,148,176],"can":[106,117],"directly":[107],"optimize.":[108],"Such":[109],"simultaneous":[110,187],"adaptation":[111],"functions":[116],"be":[118],"deceptive,":[119],"therefore":[121],"uses":[123],"quality-diversity":[125],"heuristic":[126],"Novelty":[128],"Pulsation":[129],"well":[131],"knowledge":[133],"distillation":[134],"prevent":[136],"overfitting":[137,172],"during":[138],"On":[140],"CIFAR-10":[142],"SVHN":[144],"image":[145],"classification":[146],"benchmarks,":[147],"results":[149],"faster,":[151],"more":[152],"accurate":[153],"learning.":[154],"The":[155],"discovered":[156],"adapt":[158],"process":[162],"serve":[164],"regularize":[166],"learning":[168],"task":[169],"by":[170],"discouraging":[171],"labels.":[175],"thus":[177],"demonstrates":[178],"practical":[180],"instantiation":[181],"based":[185],"on":[186]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2026-04-06T07:47:59.780226","created_date":"2025-10-10T00:00:00"}
