{"id":"https://openalex.org/W2964374138","doi":"https://doi.org/10.1145/3352020.3352029","title":"Taming Hyper-parameters in Deep Learning Systems","display_name":"Taming Hyper-parameters in Deep Learning Systems","publication_year":2019,"publication_date":"2019-07-25","ids":{"openalex":"https://openalex.org/W2964374138","doi":"https://doi.org/10.1145/3352020.3352029","mag":"2964374138"},"language":"en","primary_location":{"id":"doi:10.1145/3352020.3352029","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3352020.3352029","pdf_url":null,"source":{"id":"https://openalex.org/S50071195","display_name":"ACM SIGOPS Operating Systems Review","issn_l":"0163-5980","issn":["0163-5980","1943-586X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGOPS Operating Systems Review","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101924633","display_name":"Luo Mai","orcid":"https://orcid.org/0000-0002-7712-7558"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Luo Mai","raw_affiliation_strings":["Imperial College London, London, England UK"],"affiliations":[{"raw_affiliation_string":"Imperial College London, London, England UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017388015","display_name":"Alexandros Koliousis","orcid":"https://orcid.org/0000-0003-3006-9802"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alexandros Koliousis","raw_affiliation_strings":["Imperial College London, London, England UK"],"affiliations":[{"raw_affiliation_string":"Imperial College London, London, England UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100675165","display_name":"Li Guo","orcid":"https://orcid.org/0000-0002-9723-3294"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Guo Li","raw_affiliation_strings":["Imperial College London, London, England UK"],"affiliations":[{"raw_affiliation_string":"Imperial College London, London, England UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087572508","display_name":"Andrei-Octavian Brabete","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrei-Octavian Brabete","raw_affiliation_strings":["Imperial College London, London, England UK"],"affiliations":[{"raw_affiliation_string":"Imperial College London, London, England UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078842469","display_name":"Peter Pietzuch","orcid":"https://orcid.org/0000-0002-6963-5640"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Peter Pietzuch","raw_affiliation_strings":["Imperial College London, London, England UK"],"affiliations":[{"raw_affiliation_string":"Imperial College London, London, England UK","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101924633"],"corresponding_institution_ids":["https://openalex.org/I47508984"],"apc_list":null,"apc_paid":null,"fwci":1.6802,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.88315846,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"53","issue":"1","first_page":"52","last_page":"58"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8868011236190796},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.7233699560165405},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5659096240997314},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5630945563316345},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4974861443042755},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.37164318561553955},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3293563425540924},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.20203959941864014}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8868011236190796},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.7233699560165405},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5659096240997314},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5630945563316345},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4974861443042755},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.37164318561553955},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3293563425540924},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.20203959941864014}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3352020.3352029","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3352020.3352029","pdf_url":null,"source":{"id":"https://openalex.org/S50071195","display_name":"ACM SIGOPS Operating Systems Review","issn_l":"0163-5980","issn":["0163-5980","1943-586X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGOPS Operating Systems Review","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W59018853","https://openalex.org/W1841592590","https://openalex.org/W1988720110","https://openalex.org/W1994616650","https://openalex.org/W2083842231","https://openalex.org/W2086161653","https://openalex.org/W2108598243","https://openalex.org/W2132211083","https://openalex.org/W2136836265","https://openalex.org/W2155894447","https://openalex.org/W2168231600","https://openalex.org/W2186615578","https://openalex.org/W2427527485","https://openalex.org/W2513383847","https://openalex.org/W2559655401","https://openalex.org/W2584555500","https://openalex.org/W2597452529","https://openalex.org/W2604272474","https://openalex.org/W2612690371","https://openalex.org/W2622263826","https://openalex.org/W2625885504","https://openalex.org/W2749988060","https://openalex.org/W2766164908","https://openalex.org/W2774000609","https://openalex.org/W2783444794","https://openalex.org/W2785456003","https://openalex.org/W2799042347","https://openalex.org/W2809899846","https://openalex.org/W2884711234","https://openalex.org/W2896457183","https://openalex.org/W2900103278","https://openalex.org/W2912500072","https://openalex.org/W2913059114","https://openalex.org/W2914037279","https://openalex.org/W2930786691","https://openalex.org/W2949650786","https://openalex.org/W2950182411","https://openalex.org/W2963433607","https://openalex.org/W2963933775","https://openalex.org/W2963959597","https://openalex.org/W2970139027","https://openalex.org/W6601968593"],"related_works":["https://openalex.org/W2120447654","https://openalex.org/W2977179488","https://openalex.org/W2144453115","https://openalex.org/W2128223750","https://openalex.org/W4238532390","https://openalex.org/W2188872161","https://openalex.org/W2002978035","https://openalex.org/W2961779879","https://openalex.org/W797688974","https://openalex.org/W4380075502"],"abstract_inverted_index":{"Deep":[0],"learning":[1],"(DL)":[2],"systems":[3,40],"expose":[4],"many":[5],"tuning":[6,32],"parameters":[7],"(\"hyper-parameters\")":[8],"that":[9,37,100,108],"affect":[10],"the":[11,58,102],"performance":[12,64],"and":[13,24,65,77],"accuracy":[14],"of":[15,28,60,104],"trained":[16],"models.":[17],"Increasingly":[18],"users":[19],"struggle":[20],"to":[21,44,71],"configure":[22],"hyper-parameters,":[23,86],"a":[25,51,74],"substantial":[26],"portion":[27],"time":[29],"is":[30],"spent":[31],"them":[33],"empirically.":[34],"We":[35,48,94],"argue":[36],"future":[38],"DL":[39,53,105],"should":[41],"be":[42],"designed":[43],"help":[45],"manage":[46],"hyper-parameters.":[47],"describe":[49],"how":[50],"distributed":[52],"system":[54,106],"can":[55],"(i)":[56],"remove":[57],"impact":[59],"hyper-parameters":[61],"on":[62,73],"both":[63],"accuracy,":[66],"thus":[67],"making":[68],"it":[69],"easier":[70],"decide":[72],"good":[75],"setting,":[76],"(ii)":[78],"support":[79],"more":[80],"powerful":[81],"dynamic":[82],"policies":[83],"for":[84],"adapting":[85],"which":[87],"take":[88],"monitored":[89],"training":[90],"metrics":[91],"into":[92],"account.":[93],"report":[95],"results":[96],"from":[97],"prototype":[98],"implementations":[99],"show":[101],"practicality":[103],"designs":[107],"are":[109],"hyper-parameter-friendly.":[110]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
