{"id":"https://openalex.org/W2807087769","doi":"https://doi.org/10.1145/3195106.3195150","title":"Batch Normalization","display_name":"Batch Normalization","publication_year":2018,"publication_date":"2018-02-26","ids":{"openalex":"https://openalex.org/W2807087769","doi":"https://doi.org/10.1145/3195106.3195150","mag":"2807087769"},"language":"en","primary_location":{"id":"doi:10.1145/3195106.3195150","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3195106.3195150","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 10th International Conference on Machine Learning and Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100322712","display_name":"Yan Wang","orcid":"https://orcid.org/0000-0002-5344-1884"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yan Wang","raw_affiliation_strings":["Nanjing University of Posts and Telecommunications, Nanjing, CHINA"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Posts and Telecommunications, Nanjing, CHINA","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029552346","display_name":"Xiaofu Wu","orcid":"https://orcid.org/0000-0002-9861-331X"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaofu Wu","raw_affiliation_strings":["Nanjing University of Posts and Telecommunications, Nanjing, CHINA"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Posts and Telecommunications, Nanjing, CHINA","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030348326","display_name":"Yuanyuan Chang","orcid":"https://orcid.org/0000-0001-8562-3781"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanyuan Chang","raw_affiliation_strings":["Nanjing University of Posts and Telecommunications, Nanjing, CHINA"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Posts and Telecommunications, Nanjing, CHINA","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072562533","display_name":"Suofei Zhang","orcid":"https://orcid.org/0000-0003-4116-7555"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Suofei Zhang","raw_affiliation_strings":["Nanjing University of Posts and Telecommunications, Nanjing, CHINA"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Posts and Telecommunications, Nanjing, CHINA","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087193137","display_name":"Quan Zhou","orcid":"https://orcid.org/0000-0002-7894-7929"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quan Zhou","raw_affiliation_strings":["Nanjing University of Posts and Telecommunications, Nanjing, CHINA"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Posts and Telecommunications, Nanjing, CHINA","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101781340","display_name":"Jun Yan","orcid":"https://orcid.org/0000-0001-7113-0249"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Yan","raw_affiliation_strings":["Nanjing University of Posts and Telecommunications, Nanjing, CHINA"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Posts and Telecommunications, Nanjing, CHINA","institution_ids":["https://openalex.org/I41198531"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100322712"],"corresponding_institution_ids":["https://openalex.org/I41198531"],"apc_list":null,"apc_paid":null,"fwci":0.3134,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.60886876,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"36","last_page":"40"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.8694531917572021},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.764198899269104},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7174963355064392},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6117199659347534},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.559199333190918},{"id":"https://openalex.org/keywords/linearity","display_name":"Linearity","score":0.5356712937355042},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4370570182800293},{"id":"https://openalex.org/keywords/invertible-matrix","display_name":"Invertible matrix","score":0.43575519323349},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4260748624801636},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.41948583722114563},{"id":"https://openalex.org/keywords/standard-deviation","display_name":"Standard deviation","score":0.41810840368270874},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38550636172294617},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33255529403686523},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12324744462966919},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.0829516053199768},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07914763689041138},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.0750100314617157}],"concepts":[{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.8694531917572021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.764198899269104},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7174963355064392},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6117199659347534},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.559199333190918},{"id":"https://openalex.org/C77170095","wikidata":"https://www.wikidata.org/wiki/Q1753188","display_name":"Linearity","level":2,"score":0.5356712937355042},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4370570182800293},{"id":"https://openalex.org/C96442724","wikidata":"https://www.wikidata.org/wiki/Q242188","display_name":"Invertible matrix","level":2,"score":0.43575519323349},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4260748624801636},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.41948583722114563},{"id":"https://openalex.org/C22679943","wikidata":"https://www.wikidata.org/wiki/Q159375","display_name":"Standard deviation","level":2,"score":0.41810840368270874},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38550636172294617},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33255529403686523},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12324744462966919},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0829516053199768},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07914763689041138},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.0750100314617157},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3195106.3195150","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3195106.3195150","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 10th International Conference on Machine Learning and Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4699999988079071,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W569478347","https://openalex.org/W1487583988","https://openalex.org/W1836465849","https://openalex.org/W2004915807","https://openalex.org/W2064675550","https://openalex.org/W2073817609","https://openalex.org/W2095705004","https://openalex.org/W2123045220","https://openalex.org/W2147800946","https://openalex.org/W2194775991","https://openalex.org/W2284050935","https://openalex.org/W2559655401","https://openalex.org/W2963542991","https://openalex.org/W3118608800"],"related_works":["https://openalex.org/W4251428025","https://openalex.org/W2784467519","https://openalex.org/W4289867043","https://openalex.org/W2366459771","https://openalex.org/W2591697403","https://openalex.org/W4287755480","https://openalex.org/W3113607506","https://openalex.org/W4297779039","https://openalex.org/W2898211994","https://openalex.org/W3000197790"],"abstract_inverted_index":{"The":[0],"state-of-the-art":[1],"training":[2,18,43,82,109,154],"of":[3,12,41,74,83,155],"deep":[4,86,157],"neural":[5,87,129,158],"networks":[6],"requires":[7,150],"to":[8,24],"normalize":[9],"the":[10,13,17,31,36,42,60,65,72,81,118,122],"activities":[11],"neurons":[14],"for":[15,132,145,153],"accelerating":[16],"process.":[19],"A":[20],"standard":[21,39,133],"approach":[22],"is":[23,103],"employ":[25],"batch":[26],"normalization":[27,61],"(BN),":[28],"in":[29,107],"which":[30,56],"activations":[32],"are":[33,57],"normalized":[34],"by":[35],"mean":[37],"and":[38,54,78,111],"deviation":[40],"mini-batch.":[44],"To":[45],"be":[46],"invertible,":[47],"BN":[48,119,146],"also":[49,137],"introduces":[50],"an":[51],"adaptive":[52],"gain":[53,77],"bias":[55],"applied":[58],"after":[59],"but":[62],"often":[63,149],"before":[64],"non-linearity.":[66],"In":[67,92],"this":[68],"paper,":[69],"we":[70,99,116],"investigate":[71],"effects":[73],"learnable":[75,143],"parameters,":[76],"bias,":[79],"on":[80],"various":[84],"typical":[85],"nets,":[88],"including":[89],"ALL-CNNs,":[90],"Network":[91,93],"(NIN),":[94],"ResNets.":[95],"Through":[96],"extensive":[97],"experiments,":[98],"show":[100],"that":[101,139],"there":[102],"no":[104],"big":[105],"difference":[106],"both":[108],"convergence":[110],"final":[112,123],"test":[113],"accuracy":[114],"if":[115],"remove":[117],"layer":[120,125],"following":[121],"convolutional":[124,128],"from":[126],"a":[127],"network":[130],"(CNN)":[131],"classification":[134],"tasks.":[135],"We":[136],"observed":[138],"without":[140],"adaptively":[141],"updating":[142],"parameters":[144],"layers,":[147],"it":[148],"less":[151],"time":[152],"very":[156],"nets":[159],"such":[160],"as":[161],"ResNet-101.":[162]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
