{"id":"https://openalex.org/W3092357178","doi":"https://doi.org/10.1109/dac18072.2020.9218710","title":"SparseTrain: Exploiting Dataflow Sparsity for Efficient Convolutional Neural Networks Training","display_name":"SparseTrain: Exploiting Dataflow Sparsity for Efficient Convolutional Neural Networks Training","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3092357178","doi":"https://doi.org/10.1109/dac18072.2020.9218710","mag":"3092357178"},"language":"en","primary_location":{"id":"doi:10.1109/dac18072.2020.9218710","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac18072.2020.9218710","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 57th ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100705693","display_name":"Pengcheng Dai","orcid":"https://orcid.org/0000-0003-1455-7216"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pengcheng Dai","raw_affiliation_strings":["School of Microelectronics, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Microelectronics, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053303853","display_name":"Jianlei Yang","orcid":"https://orcid.org/0000-0001-8424-7040"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianlei Yang","raw_affiliation_strings":["School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003076964","display_name":"Xucheng Ye","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xucheng Ye","raw_affiliation_strings":["School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082464125","display_name":"Xingzhou Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingzhou Cheng","raw_affiliation_strings":["School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101912906","display_name":"Junyu Luo","orcid":"https://orcid.org/0009-0001-6894-1144"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junyu Luo","raw_affiliation_strings":["School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036239104","display_name":"Linghao Song","orcid":"https://orcid.org/0000-0002-7450-2842"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linghao Song","raw_affiliation_strings":["School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058073627","display_name":"Yiran Chen","orcid":"https://orcid.org/0000-0002-1486-8412"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiran Chen","raw_affiliation_strings":["School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109540745","display_name":"Weisheng Zhao","orcid":"https://orcid.org/0009-0003-1386-4887"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weisheng Zhao","raw_affiliation_strings":["School of Microelectronics, BDBC, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Microelectronics, BDBC, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100705693"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":1.8563,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.88031861,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.8979165554046631},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8561815619468689},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.835182249546051},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.773824155330658},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7200175523757935},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.6182191967964172},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5652202367782593},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5334838628768921},{"id":"https://openalex.org/keywords/dataflow-architecture","display_name":"Dataflow architecture","score":0.5039612650871277},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.47887176275253296},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.4630010724067688},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.42791467905044556},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.4238860309123993},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.42342427372932434},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4153272211551666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40193286538124084},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3777690827846527},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3632815182209015}],"concepts":[{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.8979165554046631},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8561815619468689},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.835182249546051},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.773824155330658},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7200175523757935},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.6182191967964172},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5652202367782593},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5334838628768921},{"id":"https://openalex.org/C176727019","wikidata":"https://www.wikidata.org/wiki/Q1172415","display_name":"Dataflow architecture","level":3,"score":0.5039612650871277},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.47887176275253296},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4630010724067688},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.42791467905044556},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.4238860309123993},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.42342427372932434},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4153272211551666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40193286538124084},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3777690827846527},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3632815182209015},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dac18072.2020.9218710","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac18072.2020.9218710","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 57th ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8899999856948853,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2041811089","https://openalex.org/W2119144962","https://openalex.org/W2140609507","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2285660444","https://openalex.org/W2442974303","https://openalex.org/W2470394683","https://openalex.org/W2605135468","https://openalex.org/W2606722458","https://openalex.org/W2613718673","https://openalex.org/W2625457103","https://openalex.org/W2754526845","https://openalex.org/W2801748224","https://openalex.org/W2807239565","https://openalex.org/W2905104204","https://openalex.org/W2919115771","https://openalex.org/W2921118685","https://openalex.org/W2949989598","https://openalex.org/W2962818002","https://openalex.org/W2964004663","https://openalex.org/W2964299589","https://openalex.org/W2982644126","https://openalex.org/W3107472389","https://openalex.org/W6677580257","https://openalex.org/W6680902425","https://openalex.org/W6684191040","https://openalex.org/W6738460352","https://openalex.org/W6744208968","https://openalex.org/W6759948036","https://openalex.org/W6766422263"],"related_works":["https://openalex.org/W2564598376","https://openalex.org/W1484403103","https://openalex.org/W2584408851","https://openalex.org/W2115158825","https://openalex.org/W2101960124","https://openalex.org/W4377693460","https://openalex.org/W2783505431","https://openalex.org/W2521947294","https://openalex.org/W2070353846","https://openalex.org/W4236419692"],"abstract_inverted_index":{"Training":[0],"Convolutional":[1],"Neural":[2],"Networks":[3],"(CNNs)":[4],"usually":[5],"requires":[6],"a":[7,47,89,113],"large":[8],"number":[9],"of":[10,33,56,103],"computational":[11],"resources.":[12],"In":[13],"this":[14],"paper,":[15],"SparseTrain":[16,138],"is":[17,92],"proposed":[18,93],"to":[19,71,117],"accelerate":[20],"CNN":[21,104],"training":[22,40,65,95,155],"by":[23,86,105],"fully":[24],"exploiting":[25],"the":[26,54,119,125,153],"sparsity.":[27],"It":[28],"mainly":[29],"involves":[30],"three":[31],"levels":[32],"innovations:":[34],"activation":[35],"gradients":[36,58],"pruning":[37,49,87],"algorithm,":[38],"sparse":[39],"dataflow,":[41],"and":[42,67,82,101,121,144],"accelerator":[43],"architecture.":[44],"By":[45],"applying":[46],"stochastic":[48],"algorithm":[50],"on":[51,124,134,149],"each":[52],"layer,":[53],"sparsity":[55,75,84],"back-propagation":[57,102],"can":[59],"be":[60],"increased":[61],"dramatically":[62],"without":[63],"degrading":[64],"accuracy":[66],"convergence":[68],"rate.":[69],"Moreover,":[70],"utilize":[72],"both":[73],"natural":[74],"(resulted":[76],"from":[77],"ReLU":[78],"or":[79],"Pooling":[80],"layers)":[81],"artificial":[83],"(brought":[85],"algorithm),":[88],"sparse-aware":[90],"architecture":[91,98,115],"for":[94],"acceleration.":[96],"This":[97],"supports":[99],"forward":[100],"adopting":[106],"1-Dimensional":[107],"convolution":[108],"dataflow.":[109],"We":[110],"have":[111],"built":[112],"cycle-accurate":[114],"simulator":[116],"evaluate":[118],"performance":[120],"efficiency":[122,147],"based":[123],"synthesized":[126],"design":[127],"with":[128,152],"14nm":[129],"FinFET":[130],"technologies.":[131],"Evaluation":[132],"results":[133],"AlexNet/ResNet":[135],"show":[136],"that":[137],"could":[139],"achieve":[140],"about":[141],"2.7\u00d7":[142],"speedup":[143],"2.2\u00d7":[145],"energy":[146],"improvement":[148],"average":[150],"compared":[151],"original":[154],"process.":[156]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":4}],"updated_date":"2026-01-09T23:09:53.351390","created_date":"2025-10-10T00:00:00"}
