{"id":"https://openalex.org/W4210928539","doi":"https://doi.org/10.1017/s135132492200002x","title":"An empirical study of cyclical learning rate on neural machine translation","display_name":"An empirical study of cyclical learning rate on neural machine translation","publication_year":2022,"publication_date":"2022-02-09","ids":{"openalex":"https://openalex.org/W4210928539","doi":"https://doi.org/10.1017/s135132492200002x"},"language":"en","primary_location":{"id":"doi:10.1017/s135132492200002x","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s135132492200002x","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101609885","display_name":"Weixuan Wang","orcid":"https://orcid.org/0000-0003-4551-0795"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weixuan Wang","raw_affiliation_strings":["Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067878144","display_name":"Choon Meng Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Choon Meng Lee","raw_affiliation_strings":["Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100335769","display_name":"Jianfeng Liu","orcid":"https://orcid.org/0000-0001-8156-223X"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianfeng Liu","raw_affiliation_strings":["Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069570906","display_name":"Talha \u00c7olako\u011flu","orcid":"https://orcid.org/0000-0002-4524-862X"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Talha Colakoglu","raw_affiliation_strings":["Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101440710","display_name":"Wei Peng","orcid":"https://orcid.org/0000-0002-0868-0974"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wei Peng","raw_affiliation_strings":["Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People\u2019s Republic of China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Artificial Intelligence Application Research Center, Huawei Technologies, Co., Ltd., Shenzhen, People's Republic of China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101440710"],"corresponding_institution_ids":["https://openalex.org/I2250955327"],"apc_list":null,"apc_paid":null,"fwci":1.1936,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.81537329,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"29","issue":"2","first_page":"316","last_page":"336"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8722683191299438},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7103042006492615},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6864987015724182},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6857302188873291},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6462775468826294},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6286888122558594},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.45578545331954956},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4410216808319092},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.07425951957702637}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8722683191299438},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7103042006492615},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6864987015724182},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6857302188873291},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6462775468826294},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6286888122558594},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.45578545331954956},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4410216808319092},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.07425951957702637},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s135132492200002x","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s135132492200002x","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.44999998807907104}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W114517082","https://openalex.org/W1686810756","https://openalex.org/W1772464306","https://openalex.org/W1924770834","https://openalex.org/W2064675550","https://openalex.org/W2124807415","https://openalex.org/W2133564696","https://openalex.org/W2146502635","https://openalex.org/W2184135559","https://openalex.org/W2194775991","https://openalex.org/W2296073425","https://openalex.org/W2523060838","https://openalex.org/W2523246573","https://openalex.org/W2618530766","https://openalex.org/W2738371943","https://openalex.org/W2796108585","https://openalex.org/W2896457183","https://openalex.org/W2907225497","https://openalex.org/W2912811302","https://openalex.org/W2933138175","https://openalex.org/W2962784628","https://openalex.org/W2963446712","https://openalex.org/W2963620441","https://openalex.org/W2964054038","https://openalex.org/W3104636952","https://openalex.org/W6631190155","https://openalex.org/W6633169802","https://openalex.org/W6681435938","https://openalex.org/W6687483927","https://openalex.org/W6725739302","https://openalex.org/W6736583452","https://openalex.org/W6739901393","https://openalex.org/W6745410505","https://openalex.org/W6747381837","https://openalex.org/W6747620207","https://openalex.org/W6757053730","https://openalex.org/W6766196973","https://openalex.org/W6767164110"],"related_works":["https://openalex.org/W3176018525","https://openalex.org/W2903533908","https://openalex.org/W3026554633","https://openalex.org/W2903810591","https://openalex.org/W4289548192","https://openalex.org/W2888520903","https://openalex.org/W2903399267","https://openalex.org/W2949454572","https://openalex.org/W2952599318","https://openalex.org/W2890256614"],"abstract_inverted_index":{"Abstract":[0],"In":[1,110],"training":[2],"deep":[3],"learning":[4,10,58,69,99,118],"networks,":[5],"the":[6,38,47,53,91,96,108],"optimizer":[7],"and":[8,95],"related":[9],"rate":[11,59,70,100],"are":[12],"often":[13],"used":[14],"without":[15],"much":[16],"thought":[17],"or":[18],"with":[19],"minimal":[20],"tuning,":[21],"even":[22],"though":[23],"it":[24],"is":[25],"crucial":[26],"in":[27],"ensuring":[28],"a":[29,33,104],"fast":[30],"convergence":[31],"to":[32,61,74,120],"good":[34],"quality":[35],"minimum":[36],"of":[37,56,93],"loss":[39],"function":[40],"that":[41,90],"can":[42,71,102],"also":[43],"generalize":[44],"well":[45],"on":[46,107],"test":[48],"dataset.":[49],"Drawing":[50],"inspiration":[51],"from":[52],"successful":[54],"application":[55],"cyclical":[57,68,98,117],"policy":[60,101],"computer":[62],"vision":[63],"tasks,":[64],"we":[65,88,112],"explore":[66],"how":[67],"be":[72],"applied":[73],"train":[75],"transformer-based":[76],"neural":[77,80,121],"networks":[78],"for":[79],"machine":[81,122],"translation.":[82],"From":[83],"our":[84],"carefully":[85],"designed":[86],"experiments,":[87],"show":[89],"choice":[92],"optimizers":[94],"associated":[97],"have":[103],"significant":[105],"impact":[106],"performance.":[109],"addition,":[111],"establish":[113],"guidelines":[114],"when":[115],"applying":[116],"rates":[119],"translation":[123],"tasks.":[124]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
