{"id":"https://openalex.org/W2918006316","doi":"https://doi.org/10.1145/3289602.3293952","title":"Highly Efficient Sparse Neural Network Computing","display_name":"Highly Efficient Sparse Neural Network Computing","publication_year":2019,"publication_date":"2019-02-20","ids":{"openalex":"https://openalex.org/W2918006316","doi":"https://doi.org/10.1145/3289602.3293952","mag":"2918006316"},"language":"en","primary_location":{"id":"doi:10.1145/3289602.3293952","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3289602.3293952","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 ACM/SIGDA International Symposium on Field-Programmable Gate Arrays","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112420086","display_name":"Yan-jie Gu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132426","display_name":"Shanghai Fudan Microelectronics (China)","ror":"https://ror.org/02vfj3j86","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210132426"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanjie Gu","raw_affiliation_strings":["Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China","institution_ids":["https://openalex.org/I4210132426"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110151105","display_name":"Jian Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132426","display_name":"Shanghai Fudan Microelectronics (China)","ror":"https://ror.org/02vfj3j86","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210132426"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Yu","raw_affiliation_strings":["Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China","institution_ids":["https://openalex.org/I4210132426"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003532531","display_name":"Tieli Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132426","display_name":"Shanghai Fudan Microelectronics (China)","ror":"https://ror.org/02vfj3j86","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210132426"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tieli Sun","raw_affiliation_strings":["Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China","institution_ids":["https://openalex.org/I4210132426"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058959396","display_name":"Chen Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132426","display_name":"Shanghai Fudan Microelectronics (China)","ror":"https://ror.org/02vfj3j86","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210132426"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Pan","raw_affiliation_strings":["Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China","institution_ids":["https://openalex.org/I4210132426"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010798470","display_name":"Zhenhao Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132426","display_name":"Shanghai Fudan Microelectronics (China)","ror":"https://ror.org/02vfj3j86","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210132426"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenhao Feng","raw_affiliation_strings":["Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China","institution_ids":["https://openalex.org/I4210132426"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101490465","display_name":"Liewei Xu","orcid":"https://orcid.org/0000-0002-8422-3409"},"institutions":[{"id":"https://openalex.org/I4210132426","display_name":"Shanghai Fudan Microelectronics (China)","ror":"https://ror.org/02vfj3j86","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210132426"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liewei Xu","raw_affiliation_strings":["Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Fudan Microelectronics Group Company Limited, Shanghai, China","institution_ids":["https://openalex.org/I4210132426"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101530541","display_name":"Chang Wu","orcid":"https://orcid.org/0000-0003-2590-6338"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chang Wu","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5112420086"],"corresponding_institution_ids":["https://openalex.org/I4210132426"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0163508,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"121","last_page":"121"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9765999913215637,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9765999913215637,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9750999808311462,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8050118684768677},{"id":"https://openalex.org/keywords/multiplexer","display_name":"Multiplexer","score":0.6886379718780518},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6448768377304077},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6063017845153809},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5687571167945862},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5202202200889587},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5053210854530334},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.47897791862487793},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.45176297426223755},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.44406113028526306},{"id":"https://openalex.org/keywords/in-memory-processing","display_name":"In-Memory Processing","score":0.42741212248802185},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.32366979122161865},{"id":"https://openalex.org/keywords/multiplexing","display_name":"Multiplexing","score":0.29550284147262573},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.17349529266357422},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.13580942153930664}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8050118684768677},{"id":"https://openalex.org/C70970002","wikidata":"https://www.wikidata.org/wiki/Q189434","display_name":"Multiplexer","level":3,"score":0.6886379718780518},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6448768377304077},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6063017845153809},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5687571167945862},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5202202200889587},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5053210854530334},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.47897791862487793},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.45176297426223755},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.44406113028526306},{"id":"https://openalex.org/C123593499","wikidata":"https://www.wikidata.org/wiki/Q6008583","display_name":"In-Memory Processing","level":5,"score":0.42741212248802185},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32366979122161865},{"id":"https://openalex.org/C19275194","wikidata":"https://www.wikidata.org/wiki/Q222903","display_name":"Multiplexing","level":2,"score":0.29550284147262573},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.17349529266357422},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.13580942153930664},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.0},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.0},{"id":"https://openalex.org/C194222762","wikidata":"https://www.wikidata.org/wiki/Q114486","display_name":"Query by Example","level":4,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3289602.3293952","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3289602.3293952","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 ACM/SIGDA International Symposium on Field-Programmable Gate Arrays","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.46000000834465027}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2058965144","https://openalex.org/W2164382479","https://openalex.org/W2146343568","https://openalex.org/W98480971","https://openalex.org/W2150291671","https://openalex.org/W2013643406","https://openalex.org/W2027972911","https://openalex.org/W2157978810","https://openalex.org/W3145926676","https://openalex.org/W3158396463"],"abstract_inverted_index":{"In":[0,86,200],"this":[1],"study,":[2],"we":[3,73,203],"propose":[4,74],"a":[5,60,75,79,95],"software-hardware":[6],"combined":[7],"solution":[8],"for":[9,166,184],"efficient":[10],"sparse":[11,25],"neural":[12,26],"network":[13,113],"computing.":[14],"Much":[15],"of":[16,63,102,139,146,197],"the":[17,29,36,51,67,90,100,118,147,159,194,201],"connections":[18],"between":[19],"each":[20,143],"layers":[21],"are":[22,31,92,136],"pruned":[23],"in":[24,32,94,142,158],"network.":[27],"Usually":[28],"weights":[30,53],"compressed":[33,52],"format,":[34],"but":[35],"corresponding":[37],"feature":[38],"map":[39],"data":[40,68,82,91,170],"need":[41],"to":[42,47,65,205],"be":[43,105,153],"pared":[44],"before":[45],"passing":[46],"computation":[48],"engine.":[49],"Since":[50],"require":[54],"indirect":[55],"memory":[56],"access,":[57],"there":[58,135],"needs":[59],"large":[61],"amount":[62,196],"multiplexers":[64],"locate":[66],"position.":[69],"Motivated":[70],"by":[71],"this,":[72],"new":[76],"architecture":[77,178],"with":[78,110,117,190,193],"much":[80],"smaller":[81,96],"selection":[83],"multiplexer":[84,103],"design.":[85,216],"our":[87,111,124,177,208,214],"hardware":[88,215],"architecture,":[89],"selected":[93],"range":[97],"so":[98],"that":[99,134,176],"scale":[101],"can":[104,152,179],"reduced.":[106],"This":[107],"is":[108],"paired":[109],"software":[112],"pruning":[114,122,209],"method.":[115],"Compared":[116],"structured":[119],"or":[120],"pattern-based":[121],"method,":[123],"algorithm":[125],"does":[126],"not":[127],"impose":[128],"such":[129],"restriction":[130],"and":[131,211],"just":[132],"ensure":[133],"same":[137,195],"numbers":[138],"non-zero":[140,150],"elements":[141,151],"z-channel":[144],"array":[145],"weights.":[148],"The":[149],"distributed":[154],"at":[155],"any":[156],"position":[157],"array.":[160],"We":[161],"also":[162],"use":[163],"dual":[164],"channel":[165],"better":[167],"efficiency":[168],"on":[169],"scheduling.":[171],"Our":[172],"experimental":[173],"results":[174],"show":[175],"reach":[180],"3x":[181],"overall":[182],"speedup":[183],"25%":[185],"sparsity":[186],"networks":[187],"when":[188],"compared":[189],"non-sparse":[191],"engines":[192],"computing":[198],"resources.":[199],"future,":[202],"plan":[204],"further":[206],"improve":[207],"algorithm,":[210],"tape":[212],"out":[213]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
