{"id":"https://openalex.org/W3130673459","doi":"https://doi.org/10.1109/tpds.2020.3047003","title":"Parallel Blockwise Knowledge Distillation for Deep Neural Network Compression","display_name":"Parallel Blockwise Knowledge Distillation for Deep Neural Network Compression","publication_year":2020,"publication_date":"2020-12-23","ids":{"openalex":"https://openalex.org/W3130673459","doi":"https://doi.org/10.1109/tpds.2020.3047003","mag":"3130673459"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2020.3047003","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3047003","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002287514","display_name":"Cody Blakeney","orcid":"https://orcid.org/0000-0002-1412-2813"},"institutions":[{"id":"https://openalex.org/I13511017","display_name":"Texas State University","ror":"https://ror.org/05h9q1g27","country_code":"US","type":"education","lineage":["https://openalex.org/I13511017"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Cody Blakeney","raw_affiliation_strings":["Department of Computer Science, Texas State University, San Marcos, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Texas State University, San Marcos, TX, USA","institution_ids":["https://openalex.org/I13511017"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042058386","display_name":"Xiaomin Li","orcid":"https://orcid.org/0000-0001-7587-0543"},"institutions":[{"id":"https://openalex.org/I13511017","display_name":"Texas State University","ror":"https://ror.org/05h9q1g27","country_code":"US","type":"education","lineage":["https://openalex.org/I13511017"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaomin Li","raw_affiliation_strings":["Department of Computer Science, Texas State University, San Marcos, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Texas State University, San Marcos, TX, USA","institution_ids":["https://openalex.org/I13511017"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100395059","display_name":"Yan Yan","orcid":"https://orcid.org/0000-0002-3674-7160"},"institutions":[{"id":"https://openalex.org/I13511017","display_name":"Texas State University","ror":"https://ror.org/05h9q1g27","country_code":"US","type":"education","lineage":["https://openalex.org/I13511017"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yan Yan","raw_affiliation_strings":["Department of Computer Science, Texas State University, San Marcos, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Texas State University, San Marcos, TX, USA","institution_ids":["https://openalex.org/I13511017"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008451482","display_name":"Ziliang Zong","orcid":"https://orcid.org/0000-0003-2693-7419"},"institutions":[{"id":"https://openalex.org/I13511017","display_name":"Texas State University","ror":"https://ror.org/05h9q1g27","country_code":"US","type":"education","lineage":["https://openalex.org/I13511017"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ziliang Zong","raw_affiliation_strings":["Department of Computer Science, Texas State University, San Marcos, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Texas State University, San Marcos, TX, USA","institution_ids":["https://openalex.org/I13511017"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5002287514"],"corresponding_institution_ids":["https://openalex.org/I13511017"],"apc_list":null,"apc_paid":null,"fwci":2.2471,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.90236607,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"32","issue":"7","first_page":"1765","last_page":"1776"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8983985781669617},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8387411832809448},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.7998173236846924},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5734822154045105},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.5325132012367249},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5213236212730408},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.4548649191856384},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3002195954322815},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27726805210113525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8983985781669617},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8387411832809448},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.7998173236846924},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5734822154045105},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5325132012367249},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5213236212730408},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.4548649191856384},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3002195954322815},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27726805210113525},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2020.3047003","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3047003","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8500000238418579,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":78,"referenced_works":["https://openalex.org/W587794757","https://openalex.org/W1686810756","https://openalex.org/W1724438581","https://openalex.org/W1821462560","https://openalex.org/W1841592590","https://openalex.org/W1996901117","https://openalex.org/W2117539524","https://openalex.org/W2119144962","https://openalex.org/W2131524184","https://openalex.org/W2162390675","https://openalex.org/W2167215970","https://openalex.org/W2172734211","https://openalex.org/W2194775991","https://openalex.org/W2233116163","https://openalex.org/W2276892413","https://openalex.org/W2294370754","https://openalex.org/W2525778437","https://openalex.org/W2533256678","https://openalex.org/W2565851976","https://openalex.org/W2585720638","https://openalex.org/W2612445135","https://openalex.org/W2612864759","https://openalex.org/W2619096655","https://openalex.org/W2625457103","https://openalex.org/W2756085244","https://openalex.org/W2769312802","https://openalex.org/W2783873922","https://openalex.org/W2787752464","https://openalex.org/W2793950911","https://openalex.org/W2796450314","https://openalex.org/W2799042347","https://openalex.org/W2808373772","https://openalex.org/W2808434111","https://openalex.org/W2907670226","https://openalex.org/W2950248853","https://openalex.org/W2950967261","https://openalex.org/W2963048316","https://openalex.org/W2963374099","https://openalex.org/W2963674932","https://openalex.org/W2963723401","https://openalex.org/W2963809228","https://openalex.org/W2963959597","https://openalex.org/W2964203871","https://openalex.org/W2964299589","https://openalex.org/W2972087877","https://openalex.org/W2972284200","https://openalex.org/W2983118306","https://openalex.org/W3004424267","https://openalex.org/W3080135165","https://openalex.org/W3118608800","https://openalex.org/W3121404598","https://openalex.org/W4240168186","https://openalex.org/W4289082871","https://openalex.org/W4289143739","https://openalex.org/W4297736277","https://openalex.org/W4297775537","https://openalex.org/W6617368339","https://openalex.org/W6637373629","https://openalex.org/W6637709462","https://openalex.org/W6638523607","https://openalex.org/W6638783484","https://openalex.org/W6677580257","https://openalex.org/W6679667936","https://openalex.org/W6683722107","https://openalex.org/W6684563725","https://openalex.org/W6685500198","https://openalex.org/W6726983090","https://openalex.org/W6737664043","https://openalex.org/W6738642365","https://openalex.org/W6744495609","https://openalex.org/W6745722055","https://openalex.org/W6748163181","https://openalex.org/W6748171661","https://openalex.org/W6750964650","https://openalex.org/W6757246177","https://openalex.org/W6767601142","https://openalex.org/W6769213770","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W2317245370","https://openalex.org/W4249323025","https://openalex.org/W198851386","https://openalex.org/W2030310580","https://openalex.org/W947442053","https://openalex.org/W1980160788","https://openalex.org/W2148915962","https://openalex.org/W2283866686","https://openalex.org/W4287182096","https://openalex.org/W27867058"],"abstract_inverted_index":{"Deep":[0],"neural":[1],"networks":[2],"(DNNs)":[3],"have":[4,57],"been":[5,58],"extremely":[6],"successful":[7],"in":[8,14,216],"solving":[9],"many":[10],"challenging":[11],"AI":[12],"tasks":[13],"natural":[15],"language":[16],"processing,":[17],"speech":[18],"recognition,":[19],"and":[20,32,54,64,140,148,184],"computer":[21],"vision":[22],"nowadays.":[23],"However,":[24,89],"DNNs":[25],"are":[26],"typically":[27],"computation":[28],"intensive,":[29],"memory":[30],"demanding,":[31],"power":[33,65],"hungry,":[34],"which":[35],"significantly":[36],"limits":[37],"their":[38],"usage":[39],"on":[40,158,181,192],"platforms":[41],"with":[42,162,196],"constrained":[43],"resources.":[44],"Therefore,":[45],"a":[46,85,106,217],"variety":[47],"of":[48,67,74,84,117,202],"compression":[49,76],"techniques":[50,77],"(e.g.,":[51,145],"quantization,":[52],"pruning,":[53],"knowledge":[55,70],"distillation)":[56],"proposed":[59],"to":[60,96,112,125,209],"reduce":[61,81],"the":[62,75,82,114,135],"size":[63,83],"consumption":[66],"DNNs.":[68,119],"Blockwise":[69],"distillation":[71,110,115,204],"is":[72,91],"one":[73],"that":[78,151,169],"can":[79,172,205],"effectively":[80],"highly":[86],"complex":[87],"DNN.":[88],"it":[90],"not":[92],"widely":[93],"adopted":[94],"due":[95],"its":[97],"long":[98],"training":[99],"time.":[100],"In":[101],"this":[102],"article,":[103],"we":[104],"propose":[105],"novel":[107],"parallel":[108],"blockwise":[109,128],"algorithm":[111,121,171],"accelerate":[113],"process":[116],"sophisticated":[118],"Our":[120],"leverages":[122],"local":[123],"information":[124],"conduct":[126],"independent":[127],"distillation,":[129,183,194],"utilizes":[130],"depthwise":[131],"separable":[132],"layers":[133],"as":[134],"efficient":[136],"replacement":[137],"block":[138],"architecture,":[139],"properly":[141],"addresses":[142],"limiting":[143],"factors":[144],"dependency,":[146],"synchronization,":[147],"load":[149],"balancing)":[150],"affect":[152],"parallelism.":[153],"The":[154,200],"experimental":[155],"results":[156],"running":[157],"an":[159],"AMD":[160],"server":[161],"four":[163,213],"Geforce":[164],"RTX":[165],"2080Ti":[166],"GPUs":[167,215],"show":[168],"our":[170],"achieve":[173],"3x":[174],"speedup":[175,186,201],"plus":[176,187],"19":[177],"percent":[178,189],"energy":[179,190],"savings":[180,191],"VGG":[182],"3.5x":[185],"29":[188],"ResNet":[193,203],"both":[195],"negligible":[197],"accuracy":[198],"loss.":[199],"be":[206],"further":[207],"improved":[208],"3.87":[210],"when":[211],"using":[212],"RTX6000":[214],"distributed":[218],"cluster.":[219]},"counts_by_year":[{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
