{"id":"https://openalex.org/W3033960544","doi":"https://doi.org/10.1109/tnnls.2021.3069970","title":"EDropout: Energy-Based Dropout and Pruning of Deep Neural Networks","display_name":"EDropout: Energy-Based Dropout and Pruning of Deep Neural Networks","publication_year":2021,"publication_date":"2021-04-08","ids":{"openalex":"https://openalex.org/W3033960544","doi":"https://doi.org/10.1109/tnnls.2021.3069970","mag":"3033960544","pmid":"https://pubmed.ncbi.nlm.nih.gov/33830931"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2021.3069970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3069970","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2006.04270","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035444332","display_name":"Hojjat Salehinejad","orcid":"https://orcid.org/0000-0002-9636-863X"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Hojjat Salehinejad","raw_affiliation_strings":["Department of Electrical &#x0026; Computer Engineering, University of Toronto, Toronto, ON, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical &#x0026; Computer Engineering, University of Toronto, Toronto, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089951737","display_name":"Shahrokh Valaee","orcid":"https://orcid.org/0000-0001-6254-1660"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Shahrokh Valaee","raw_affiliation_strings":["Department of Electrical &#x0026; Computer Engineering, University of Toronto, Toronto, ON, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical &#x0026; Computer Engineering, University of Toronto, Toronto, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5035444332"],"corresponding_institution_ids":["https://openalex.org/I185261750"],"apc_list":null,"apc_paid":null,"fwci":4.1756,"has_fulltext":false,"cited_by_count":52,"citation_normalized_percentile":{"value":0.95297026,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"33","issue":"10","first_page":"5279","last_page":"5292"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.7744491100311279},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6532193422317505},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.620720386505127},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.5868678689002991},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5848897695541382},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.4466370642185211},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.43570172786712646},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4311271011829376},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3655480146408081},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35745975375175476}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.7744491100311279},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6532193422317505},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.620720386505127},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.5868678689002991},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5848897695541382},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.4466370642185211},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.43570172786712646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4311271011829376},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3655480146408081},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35745975375175476},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1109/tnnls.2021.3069970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3069970","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:33830931","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33830931","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:arXiv.org:2006.04270","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2006.04270","pdf_url":"https://arxiv.org/pdf/2006.04270","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2006.04270","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2006.04270","pdf_url":"https://arxiv.org/pdf/2006.04270","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.8999999761581421,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321879","display_name":"Fujitsu","ror":"https://ror.org/038e2g226"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":79,"referenced_works":["https://openalex.org/W4919037","https://openalex.org/W6908809","https://openalex.org/W1503398984","https://openalex.org/W1513873506","https://openalex.org/W1519004125","https://openalex.org/W1523985187","https://openalex.org/W1821462560","https://openalex.org/W1826234144","https://openalex.org/W2043846600","https://openalex.org/W2095705004","https://openalex.org/W2108598243","https://openalex.org/W2114766824","https://openalex.org/W2119144962","https://openalex.org/W2133583641","https://openalex.org/W2136836265","https://openalex.org/W2156297475","https://openalex.org/W2161914416","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2276892413","https://openalex.org/W2279098554","https://openalex.org/W2294861638","https://openalex.org/W2463532758","https://openalex.org/W2533598788","https://openalex.org/W2564702731","https://openalex.org/W2570915410","https://openalex.org/W2734190907","https://openalex.org/W2746314669","https://openalex.org/W2750384547","https://openalex.org/W2891179104","https://openalex.org/W2896409484","https://openalex.org/W2902986194","https://openalex.org/W2916313152","https://openalex.org/W2943008967","https://openalex.org/W2951569836","https://openalex.org/W2951595529","https://openalex.org/W2952746978","https://openalex.org/W2962965870","https://openalex.org/W2963080758","https://openalex.org/W2964233199","https://openalex.org/W2964299589","https://openalex.org/W2970971581","https://openalex.org/W2994434574","https://openalex.org/W3003410437","https://openalex.org/W3008708068","https://openalex.org/W3011234689","https://openalex.org/W3034550700","https://openalex.org/W3118608800","https://openalex.org/W3124569721","https://openalex.org/W3162227392","https://openalex.org/W4238076109","https://openalex.org/W4287997702","https://openalex.org/W4288364646","https://openalex.org/W4294170691","https://openalex.org/W4297775537","https://openalex.org/W4297813615","https://openalex.org/W4300081896","https://openalex.org/W6600213771","https://openalex.org/W6600284362","https://openalex.org/W6638523607","https://openalex.org/W6638836233","https://openalex.org/W6674330103","https://openalex.org/W6677103964","https://openalex.org/W6677580257","https://openalex.org/W6679955943","https://openalex.org/W6682691769","https://openalex.org/W6683825394","https://openalex.org/W6695314431","https://openalex.org/W6719169591","https://openalex.org/W6726275242","https://openalex.org/W6731768130","https://openalex.org/W6733877748","https://openalex.org/W6737664043","https://openalex.org/W6743428213","https://openalex.org/W6743688258","https://openalex.org/W6755843862","https://openalex.org/W6762269264","https://openalex.org/W6771731465","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W3082178636","https://openalex.org/W2088845016","https://openalex.org/W589102260","https://openalex.org/W1966421350","https://openalex.org/W2782041652","https://openalex.org/W2894173309","https://openalex.org/W4387932263","https://openalex.org/W2098962763","https://openalex.org/W2371065793","https://openalex.org/W2157746493"],"abstract_inverted_index":{"Dropout":[0],"is":[1,101,138],"a":[2,8,11,48,57,73,121,139,168,252],"well-known":[3],"regularization":[4],"method":[5,209],"by":[6,27],"sampling":[7],"sub-network":[9],"from":[10,62],"larger":[12],"deep":[13],"neural":[14,40,66,195],"network":[15,201],"and":[16,104,132,150,220,229,233,238,267,273],"training":[17],"different":[18,21,211],"sub-networks":[19,61],"on":[20,210,222,249],"subsets":[22],"of":[23,50,59,188,213,241,255,259,271],"the":[24,28,88,107,113,133,142,147,151,156,180,189,200,207,223,235,242,260],"data.":[25],"Inspired":[26],"dropout":[29,176],"concept,":[30],"we":[31],"propose":[32],"EDropout":[33,192,248],"as":[34,175],"an":[35,63,183],"energy-based":[36,83],"framework":[37],"for":[38,128],"pruning":[39,52,80,99,130,148,169,179,190,236,253],"networks":[41,196,245],"in":[42,120,159],"classification":[43,239,275],"tasks.":[44],"In":[45],"this":[46],"approach,":[47],"set":[49,58],"binary":[51],"state":[53,100],"vectors":[54],"(population)":[55],"represents":[56],"corresponding":[60],"arbitrary":[64],"original":[65,108],"network.":[67,109,181],"An":[68],"energy":[69,75,95,143],"loss":[70,76],"function":[71],"assigns":[72],"scalar":[74],"value":[77],"to":[78,90,106,111,167,178],"each":[79,160],"state.":[81,170],"The":[82,97,124,162,244],"model":[84],"(EBM)":[85],"stochastically":[86],"evolves":[87],"population":[89,163],"find":[91],"states":[92,131],"with":[93,247,263],"lower":[94],"loss.":[96],"best":[98],"then":[102],"selected":[103],"applied":[105],"Similar":[110],"dropout,":[112],"kept":[114,157],"weights":[115],"are":[116],"updated":[117],"using":[118],"backpropagation":[119],"probabilistic":[122,152],"model.":[123],"EBM":[125],"again":[126],"searches":[127],"better":[129],"cycle":[134],"continuous.":[135],"This":[136,171],"procedure":[137],"switching":[140],"between":[141],"model,":[144,153],"which":[145,154],"manages":[146],"states,":[149],"updates":[155],"weights,":[158],"iteration.":[161],"can":[164,172,193],"dynamically":[165],"converge":[166],"be":[173],"interpreted":[174],"leading":[177],"From":[182],"implementation":[184],"perspective,":[185],"unlike":[186],"most":[187],"methods,":[191],"prune":[194],"without":[197],"manually":[198],"modifying":[199],"architecture":[202],"code.":[203],"We":[204],"have":[205],"evaluated":[206],"proposed":[208],"flavors":[212],"ResNets,":[214],"AlexNet,":[215],"l<sub>1</sub>":[216],"pruning,":[217],"ThinNet,":[218],"ChannelNet,":[219],"SqueezeNet":[221],"Kuzushiji,":[224],"Fashion,":[225],"CIFAR-10,":[226],"CIFAR-100,":[227],"Flowers,":[228],"ImageNet":[230],"data":[231],"sets,":[232],"compared":[234],"rate":[237,254],"performance":[240],"models.":[243],"trained":[246],"average":[250],"achieved":[251],"more":[256],"than":[257],"50%":[258],"trainable":[261],"parameters":[262],"approximately":[264],"<":[265,268],"5%":[266],"1%":[269],"drop":[270],"Top-1":[272],"Top-5":[274],"accuracy,":[276],"respectively.":[277]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-12T07:58:50.170612","created_date":"2025-10-10T00:00:00"}
