{"id":"https://openalex.org/W4387996879","doi":"https://doi.org/10.1109/tnnls.2023.3325541","title":"A Robust Initialization of Residual Blocks for Effective ResNet Training Without Batch Normalization","display_name":"A Robust Initialization of Residual Blocks for Effective ResNet Training Without Batch Normalization","publication_year":2023,"publication_date":"2023-10-27","ids":{"openalex":"https://openalex.org/W4387996879","doi":"https://doi.org/10.1109/tnnls.2023.3325541","pmid":"https://pubmed.ncbi.nlm.nih.gov/37889824"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2023.3325541","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3325541","pdf_url":"https://ieeexplore.ieee.org/ielx7/5962385/6104215/10298277.pdf","source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ieeexplore.ieee.org/ielx7/5962385/6104215/10298277.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026131161","display_name":"Enrico Civitelli","orcid":"https://orcid.org/0000-0001-5322-4831"},"institutions":[{"id":"https://openalex.org/I45084792","display_name":"University of Florence","ror":"https://ror.org/04jr1s763","country_code":"IT","type":"education","lineage":["https://openalex.org/I45084792"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Enrico Civitelli","raw_affiliation_strings":["Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy","institution_ids":["https://openalex.org/I45084792"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009013106","display_name":"Alessio Sortino","orcid":"https://orcid.org/0000-0002-3971-3441"},"institutions":[{"id":"https://openalex.org/I45084792","display_name":"University of Florence","ror":"https://ror.org/04jr1s763","country_code":"IT","type":"education","lineage":["https://openalex.org/I45084792"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessio Sortino","raw_affiliation_strings":["Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy","institution_ids":["https://openalex.org/I45084792"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037874811","display_name":"Matteo Lapucci","orcid":"https://orcid.org/0000-0002-2488-5486"},"institutions":[{"id":"https://openalex.org/I45084792","display_name":"University of Florence","ror":"https://ror.org/04jr1s763","country_code":"IT","type":"education","lineage":["https://openalex.org/I45084792"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Matteo Lapucci","raw_affiliation_strings":["Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy","institution_ids":["https://openalex.org/I45084792"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049843644","display_name":"Francesco Bagattini","orcid":"https://orcid.org/0000-0003-1645-1749"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Francesco Bagattini","raw_affiliation_strings":["Flair-Tech, Florence, Italy"],"affiliations":[{"raw_affiliation_string":"Flair-Tech, Florence, Italy","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073824203","display_name":"Giulio Galvan","orcid":"https://orcid.org/0000-0002-0384-0334"},"institutions":[{"id":"https://openalex.org/I45084792","display_name":"University of Florence","ror":"https://ror.org/04jr1s763","country_code":"IT","type":"education","lineage":["https://openalex.org/I45084792"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giulio Galvan","raw_affiliation_strings":["Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy","Flair-Tech, Florence, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Ingegneria dell&#x2019;Informazione, Universit&#x00E0; di Firenze, Florence, Italy","institution_ids":["https://openalex.org/I45084792"]},{"raw_affiliation_string":"Flair-Tech, Florence, Italy","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5026131161"],"corresponding_institution_ids":["https://openalex.org/I45084792"],"apc_list":null,"apc_paid":null,"fwci":0.6105,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.70219075,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"36","issue":"1","first_page":"1947","last_page":"1952"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.9130455851554871},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.8780276775360107},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7638648152351379},{"id":"https://openalex.org/keywords/residual-neural-network","display_name":"Residual neural network","score":0.760542631149292},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.6609789133071899},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.6518999338150024},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49738767743110657},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4683617353439331},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4436168968677521},{"id":"https://openalex.org/keywords/network-architecture","display_name":"Network architecture","score":0.4258997142314911},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.4219492971897125},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.36690694093704224},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3416327238082886},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33928871154785156},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.09505021572113037}],"concepts":[{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.9130455851554871},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.8780276775360107},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7638648152351379},{"id":"https://openalex.org/C2944601119","wikidata":"https://www.wikidata.org/wiki/Q43744058","display_name":"Residual neural network","level":3,"score":0.760542631149292},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.6609789133071899},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.6518999338150024},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49738767743110657},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4683617353439331},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4436168968677521},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.4258997142314911},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4219492971897125},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.36690694093704224},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3416327238082886},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33928871154785156},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.09505021572113037},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tnnls.2023.3325541","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3325541","pdf_url":"https://ieeexplore.ieee.org/ielx7/5962385/6104215/10298277.pdf","source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:37889824","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37889824","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:flore.unifi.it:2158/1342851","is_oa":true,"landing_page_url":"https://hdl.handle.net/2158/1342851","pdf_url":"https://flore.unifi.it/bitstream/2158/1342851/2/A_Robust_Initialization_of_Residual_Blocks_for_Effective_ResNet_Training_Without_Batch_Normalization.pdf","source":{"id":"https://openalex.org/S4306402033","display_name":"Florence Research (University of Florence)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45084792","host_organization_name":"University of Florence","host_organization_lineage":["https://openalex.org/I45084792"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1109/tnnls.2023.3325541","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3325541","pdf_url":"https://ieeexplore.ieee.org/ielx7/5962385/6104215/10298277.pdf","source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.4399999976158142,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387996879.pdf","grobid_xml":"https://content.openalex.org/works/W4387996879.grobid-xml"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W1533861849","https://openalex.org/W1677182931","https://openalex.org/W1836465849","https://openalex.org/W2108598243","https://openalex.org/W2114279993","https://openalex.org/W2194775991","https://openalex.org/W2292729293","https://openalex.org/W2302255633","https://openalex.org/W2617242334","https://openalex.org/W2780149736","https://openalex.org/W2789027062","https://openalex.org/W2948227433","https://openalex.org/W2952258850","https://openalex.org/W2963263347","https://openalex.org/W2970674435","https://openalex.org/W2995333370","https://openalex.org/W2998655644","https://openalex.org/W3004591935","https://openalex.org/W3010768098","https://openalex.org/W3035682985","https://openalex.org/W3035794324","https://openalex.org/W3043569052","https://openalex.org/W3048030262","https://openalex.org/W3093643905","https://openalex.org/W3098912370","https://openalex.org/W3108417339","https://openalex.org/W3118608800","https://openalex.org/W3128633047","https://openalex.org/W3132672614","https://openalex.org/W3173196825","https://openalex.org/W4295312788","https://openalex.org/W4295773261","https://openalex.org/W6631943919","https://openalex.org/W6726497184","https://openalex.org/W6738534199","https://openalex.org/W6749897870","https://openalex.org/W6754615192","https://openalex.org/W6762974433","https://openalex.org/W6767340034","https://openalex.org/W6771763659","https://openalex.org/W6774776664","https://openalex.org/W6779724054","https://openalex.org/W6781575362","https://openalex.org/W6785989746","https://openalex.org/W6787972765","https://openalex.org/W6788627230","https://openalex.org/W6790428460"],"related_works":["https://openalex.org/W4226466875","https://openalex.org/W2977257638","https://openalex.org/W4288095186","https://openalex.org/W2755231872","https://openalex.org/W3210541621","https://openalex.org/W4287755480","https://openalex.org/W3113607506","https://openalex.org/W4297779039","https://openalex.org/W2898211994","https://openalex.org/W2604237878"],"abstract_inverted_index":{"Batch":[0],"normalization":[1],"is":[2,37,68],"an":[3],"essential":[4],"component":[5],"of":[6,55],"all":[7],"state-of-the-art":[8],"neural":[9],"networks":[10],"architectures.":[11,28],"However,":[12],"since":[13],"it":[14],"introduces":[15],"many":[16],"practical":[17],"issues,":[18],"much":[19],"recent":[20],"research":[21],"has":[22],"been":[23],"devoted":[24],"to":[25,39,51,59],"designing":[26],"normalization-free":[27,42],"In":[29,44],"this":[30,74],"brief,":[31],"we":[32,46],"show":[33,72],"that":[34,64,73],"weights":[35],"initialization":[36],"key":[38],"train":[40],"ResNet-like":[41],"networks.":[43],"particular,":[45],"propose":[47],"a":[48,56],"slight":[49],"modification":[50],"the":[52,60,65],"summation":[53],"operation":[54],"block":[57],"output":[58],"skip-connection":[61],"branch,":[62],"so":[63],"whole":[66],"network":[67],"correctly":[69],"initialized.":[70],"We":[71],"modified":[75],"architecture":[76],"achieves":[77],"competitive":[78],"results":[79],"on":[80],"CIFAR-10,":[81],"CIFAR-100":[82],"and":[83],"ImageNet":[84],"without":[85],"further":[86],"regularization":[87],"nor":[88],"algorithmic":[89],"modifications.":[90]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-16T09:10:04.655348","created_date":"2025-10-10T00:00:00"}
