{"id":"https://openalex.org/W3007844454","doi":"https://doi.org/10.1109/bigdata47090.2019.9006104","title":"Demystifying Learning Rate Policies for High Accuracy Training of Deep Neural Networks","display_name":"Demystifying Learning Rate Policies for High Accuracy Training of Deep Neural Networks","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3007844454","doi":"https://doi.org/10.1109/bigdata47090.2019.9006104","mag":"3007844454"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata47090.2019.9006104","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata47090.2019.9006104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060093535","display_name":"Yanzhao Wu","orcid":"https://orcid.org/0000-0001-8761-5486"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yanzhao Wu","raw_affiliation_strings":["School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100343991","display_name":"Ling Liu","orcid":"https://orcid.org/0000-0002-4138-3082"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ling Liu","raw_affiliation_strings":["School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100780771","display_name":"J. Alexander Bae","orcid":"https://orcid.org/0000-0002-4681-6342"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juhyun Bae","raw_affiliation_strings":["School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028240524","display_name":"Ka-Ho Chow","orcid":"https://orcid.org/0000-0001-5917-2577"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ka-Ho Chow","raw_affiliation_strings":["School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102744844","display_name":"Arun Iyengar","orcid":"https://orcid.org/0000-0003-4679-1920"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arun Iyengar","raw_affiliation_strings":["Yorktown Heights, IBM Thomas. J. Watson Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"Yorktown Heights, IBM Thomas. J. Watson Research, NY, USA","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081442372","display_name":"Calton Pu","orcid":"https://orcid.org/0000-0002-6616-8987"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Calton Pu","raw_affiliation_strings":["School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069331320","display_name":"Wenqi Wei","orcid":"https://orcid.org/0000-0001-9177-114X"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wenqi Wei","raw_affiliation_strings":["School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100445935","display_name":"Lei Yu","orcid":"https://orcid.org/0000-0002-9188-6112"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lei Yu","raw_affiliation_strings":["Yorktown Heights, IBM Thomas. J. Watson Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"Yorktown Heights, IBM Thomas. J. Watson Research, NY, USA","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100665641","display_name":"Qi Zhang","orcid":"https://orcid.org/0000-0003-2942-7430"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qi Zhang","raw_affiliation_strings":["Yorktown Heights, IBM Thomas. J. Watson Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"Yorktown Heights, IBM Thomas. J. Watson Research, NY, USA","institution_ids":["https://openalex.org/I4210114115"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5060093535"],"corresponding_institution_ids":["https://openalex.org/I130701444"],"apc_list":null,"apc_paid":null,"fwci":7.0813,"has_fulltext":false,"cited_by_count":129,"citation_normalized_percentile":{"value":0.97577098,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1971","last_page":"1980"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8027085661888123},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7540360689163208},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6763899326324463},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6521092057228088},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.602300763130188},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6022233366966248},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5909228324890137},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.5832891464233398},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.516548752784729},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.47449421882629395},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.460449755191803},{"id":"https://openalex.org/keywords/constant","display_name":"Constant (computer programming)","score":0.4504576027393341}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8027085661888123},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7540360689163208},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6763899326324463},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6521092057228088},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.602300763130188},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6022233366966248},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5909228324890137},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.5832891464233398},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.516548752784729},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.47449421882629395},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.460449755191803},{"id":"https://openalex.org/C2777027219","wikidata":"https://www.wikidata.org/wiki/Q1284190","display_name":"Constant (computer programming)","level":2,"score":0.4504576027393341},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata47090.2019.9006104","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata47090.2019.9006104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"pmh:oai:hub.hku.hk:10722/343296","is_oa":false,"landing_page_url":"https://hub.hku.hk/handle/10722/343296","pdf_url":null,"source":{"id":"https://openalex.org/S4377196271","display_name":"The HKU Scholars Hub (University of Hong Kong)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I889458895","host_organization_name":"University of Hong Kong","host_organization_lineage":["https://openalex.org/I889458895"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference_Paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W6908809","https://openalex.org/W60686164","https://openalex.org/W104184427","https://openalex.org/W1522301498","https://openalex.org/W1533861849","https://openalex.org/W1570413585","https://openalex.org/W1806891645","https://openalex.org/W1814095264","https://openalex.org/W1955857676","https://openalex.org/W1980287119","https://openalex.org/W2112796928","https://openalex.org/W2120420045","https://openalex.org/W2146502635","https://openalex.org/W2155893237","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2518108298","https://openalex.org/W2523246573","https://openalex.org/W2622263826","https://openalex.org/W2883457665","https://openalex.org/W2898496135","https://openalex.org/W2912801804","https://openalex.org/W2949676527","https://openalex.org/W2951650375","https://openalex.org/W2962931450","https://openalex.org/W2963263347","https://openalex.org/W2963363373","https://openalex.org/W2963587345","https://openalex.org/W2964050365","https://openalex.org/W2964054038","https://openalex.org/W2964121744","https://openalex.org/W3106099468","https://openalex.org/W4290728118","https://openalex.org/W4300900294","https://openalex.org/W6600284362","https://openalex.org/W6604254268","https://openalex.org/W6631190155","https://openalex.org/W6631943919","https://openalex.org/W6634326774","https://openalex.org/W6638524475","https://openalex.org/W6677872732","https://openalex.org/W6681435938","https://openalex.org/W6684191040","https://openalex.org/W6726497184","https://openalex.org/W6727249380","https://openalex.org/W6729210268","https://openalex.org/W6739622702","https://openalex.org/W6743178762"],"related_works":["https://openalex.org/W4238897586","https://openalex.org/W435179959","https://openalex.org/W2619091065","https://openalex.org/W4377865163","https://openalex.org/W3193857078","https://openalex.org/W2888956734","https://openalex.org/W3000197790","https://openalex.org/W4315865067","https://openalex.org/W3208304128","https://openalex.org/W2979433843"],"abstract_inverted_index":{"Learning":[0],"Rate":[1],"(LR)":[2],"is":[3,27],"an":[4,123,153],"important":[5],"hyper-parameter":[6],"to":[7,29,67,134,159,173],"tune":[8],"for":[9,18,35,104,144,193],"effective":[10,186],"training":[11,36,53,145],"of":[12,21,45,51,77,102,164,177],"deep":[13,156],"neural":[14],"networks":[15],"(DNNs).":[16],"Even":[17],"the":[19,52,111,161,175],"baseline":[20],"a":[22,31,37,74,100],"constant":[23,33],"learning":[24,40,79,157],"rate,":[25],"it":[26],"non-trivial":[28],"choose":[30],"good":[32,136,182],"value":[34,95,188],"DNN.":[38],"Dynamic":[39],"rates":[41],"involve":[42],"multi-step":[43],"tuning":[44,162,176],"LR":[46,85,108,124,137,142,165,178,183,187,194],"values":[47],"at":[48],"various":[49],"stages":[50],"process":[54],"and":[55,59,82,94,106,116,118,131,139,190],"offer":[56],"high":[57],"accuracy":[58],"fast":[60],"convergence.":[61],"However,":[62],"they":[63],"are":[64],"much":[65],"harder":[66],"tune.":[68],"In":[69],"this":[70],"paper,":[71],"we":[72,171],"present":[73],"comprehensive":[75],"study":[76],"13":[78],"rate":[80],"functions":[81],"their":[83,89,146],"associated":[84],"policies":[86,138,143,179,184],"by":[87,180],"examining":[88],"range":[90],"parameters,":[91,93],"step":[92,191],"update":[96,195],"parameters.":[97],"We":[98,148],"propose":[99],"set":[101],"metrics":[103],"evaluating":[105],"selecting":[107],"policies,":[109],"including":[110],"classification":[112],"confidence,":[113],"variance,":[114],"cost,":[115],"robustness,":[117],"implement":[119],"them":[120],"in":[121],"LRBench,":[122],"benchmarking":[125],"system.":[126],"LRBench":[127,150],"can":[128],"assist":[129],"end-users":[130],"DNN":[132],"developers":[133],"select":[135],"avoid":[140],"bad":[141],"DNNs.":[147],"tested":[149],"on":[151],"Caffe,":[152],"open":[154],"source":[155],"framework,":[158],"showcase":[160],"optimization":[163],"policies.":[166],"Evaluated":[167],"through":[168],"extensive":[169],"experiments,":[170],"attempt":[172],"demystify":[174],"identifying":[181],"with":[185],"ranges":[189],"sizes":[192],"schedules.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":22},{"year":2024,"cited_by_count":32},{"year":2023,"cited_by_count":22},{"year":2022,"cited_by_count":22},{"year":2021,"cited_by_count":21},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":2}],"updated_date":"2026-03-17T09:09:15.849793","created_date":"2025-10-10T00:00:00"}
