{"id":"https://openalex.org/W4391436329","doi":"https://doi.org/10.1145/3643860","title":"Guidelines for the Regularization of Gammas in Batch Normalization for Deep Residual Networks","display_name":"Guidelines for the Regularization of Gammas in Batch Normalization for Deep Residual Networks","publication_year":2024,"publication_date":"2024-02-01","ids":{"openalex":"https://openalex.org/W4391436329","doi":"https://doi.org/10.1145/3643860"},"language":"en","primary_location":{"id":"doi:10.1145/3643860","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3643860","pdf_url":null,"source":{"id":"https://openalex.org/S2492086750","display_name":"ACM Transactions on Intelligent Systems and Technology","issn_l":"2157-6904","issn":["2157-6904","2157-6912"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Intelligent Systems and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100666999","display_name":"Bum Jun Kim","orcid":"https://orcid.org/0000-0003-4155-9225"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Bum Jun Kim","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang, Republic of Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024905192","display_name":"Hyeyeon Choi","orcid":"https://orcid.org/0000-0001-8221-2338"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyeyeon Choi","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang, Republic of Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074023735","display_name":"Hyeonah Jang","orcid":"https://orcid.org/0000-0001-5344-8114"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyeonah Jang","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang, Republic of Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100452155","display_name":"Sang Woo Kim","orcid":"https://orcid.org/0000-0001-6023-1837"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sang Woo Kim","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang, Republic of Korea","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100666999"],"corresponding_institution_ids":["https://openalex.org/I123900574"],"apc_list":null,"apc_paid":null,"fwci":0.7873,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.69623264,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"15","issue":"3","first_page":"1","last_page":"20"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.7893993854522705},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.782825767993927},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.7598522901535034},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.7156277894973755},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4952811300754547},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4679008722305298},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4436795115470886},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.42428505420684814},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38456788659095764},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3655356764793396},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1790294647216797}],"concepts":[{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.7893993854522705},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.782825767993927},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.7598522901535034},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.7156277894973755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4952811300754547},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4679008722305298},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4436795115470886},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.42428505420684814},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38456788659095764},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3655356764793396},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1790294647216797},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3643860","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3643860","pdf_url":null,"source":{"id":"https://openalex.org/S2492086750","display_name":"ACM Transactions on Intelligent Systems and Technology","issn_l":"2157-6904","issn":["2157-6904","2157-6912"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Intelligent Systems and Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8190979439","display_name":null,"funder_award_id":"IO201210-08019-01","funder_id":"https://openalex.org/F4320332195","funder_display_name":"Samsung"}],"funders":[{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2622263826","https://openalex.org/W2626017178","https://openalex.org/W2884711234","https://openalex.org/W2888685797","https://openalex.org/W2974291863","https://openalex.org/W3124219615","https://openalex.org/W4200409985","https://openalex.org/W4238100585","https://openalex.org/W4308437157","https://openalex.org/W4308445188"],"related_works":["https://openalex.org/W2591697403","https://openalex.org/W2944728705","https://openalex.org/W2904022177","https://openalex.org/W2359348847","https://openalex.org/W3011538607","https://openalex.org/W4297807321","https://openalex.org/W4287755480","https://openalex.org/W3113607506","https://openalex.org/W4297779039","https://openalex.org/W4220659530"],"abstract_inverted_index":{"L":[0,38,65,116,133,147],"2":[1,39,66,117,134,148],"regularization":[2,40,67,118,135,149],"for":[3,41,68,123],"weights":[4],"in":[5,50],"neural":[6],"networks":[7,181],"is":[8,48,70,160],"widely":[9],"used":[10],"as":[11,33],"a":[12,34],"standard":[13],"training":[14],"trick.":[15],"In":[16,59,126],"addition":[17],"to":[18,83,114,136,141,150,155],"weights,":[19],"the":[20,55,85,98,109],"use":[21],"of":[22,100,179],"batch":[23],"normalization":[24],"involves":[25],"an":[26,44,90],"additional":[27],"trainable":[28],"parameter":[29],"\u03b3,":[30],"which":[31,159],"acts":[32],"scaling":[35],"factor.":[36],"However,":[37],"\u03b3":[42,69,113,138,152],"remains":[43],"undiscussed":[45],"mystery":[46],"and":[47,57,93,111,119,175,182],"applied":[49],"different":[51],"ways":[52],"depending":[53],"on":[54],"library":[56],"practitioner.":[58],"this":[60,74],"article,":[61],"we":[62,76,107,129],"study":[63],"whether":[64],"valid.":[71],"To":[72],"explore":[73],"issue,":[75],"consider":[77],"two":[78,105],"approaches:":[79],"(1)":[80],"variance":[81],"control":[82],"make":[84],"residual":[86,180],"network":[87],"behave":[88],"like":[89],"identity":[91],"mapping":[92],"(2)":[94],"stable":[95],"optimization":[96],"through":[97,172],"improvement":[99],"effective":[101],"learning":[102],"rate.":[103],"Through":[104],"analyses,":[106],"specify":[108],"desirable":[110],"undesirable":[112],"apply":[115],"propose":[120],"four":[121,164],"guidelines":[122,168],"managing":[124],"them.":[125],"several":[127],"experiments,":[128],"observed":[130],"that":[131],"applying":[132,146],"applicable":[137],"increased":[139],"1%":[140,154],"4%":[142],"classification":[143,157],"accuracy,":[144,158],"whereas":[145],"inapplicable":[151],"decreased":[153],"3%":[156],"consistent":[161],"with":[162],"our":[163],"guidelines.":[165],"Our":[166],"proposed":[167],"were":[169],"further":[170],"validated":[171],"various":[173],"tasks":[174],"architectures,":[176],"including":[177],"variants":[178],"transformers.":[183]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
