{"id":"https://openalex.org/W4320067931","doi":"https://doi.org/10.1145/3545008.3545086","title":"DSSA: Dual-Side Sparse Systolic Array Architecture for Accelerating Convolutional Neural Network Training","display_name":"DSSA: Dual-Side Sparse Systolic Array Architecture for Accelerating Convolutional Neural Network Training","publication_year":2022,"publication_date":"2022-08-29","ids":{"openalex":"https://openalex.org/W4320067931","doi":"https://doi.org/10.1145/3545008.3545086"},"language":"en","primary_location":{"id":"doi:10.1145/3545008.3545086","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3545008.3545086","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 51st International Conference on Parallel Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103161855","display_name":"Zhengbo Chen","orcid":"https://orcid.org/0000-0002-1208-0760"},"institutions":[{"id":"https://openalex.org/I40246663","display_name":"Chinese Academy of Engineering","ror":"https://ror.org/00z3yke57","country_code":"CN","type":"other","lineage":["https://openalex.org/I40246663"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhengbo Chen","raw_affiliation_strings":["Chinese Academy of Engineering, China","Information Engineering University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Chinese Academy of Engineering, China","institution_ids":["https://openalex.org/I40246663"]},{"raw_affiliation_string":"Information Engineering University, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100745056","display_name":"Qi Yu","orcid":"https://orcid.org/0000-0003-3969-6634"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi Yu","raw_affiliation_strings":["State Key Laboratory of Mathematical Engineering and Advanced Computing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Mathematical Engineering and Advanced Computing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101665003","display_name":"Zheng Fang","orcid":"https://orcid.org/0000-0002-1291-7022"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang Zheng","raw_affiliation_strings":["State Key Laboratory of Mathematical Engineering and Advanced Computing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Mathematical Engineering and Advanced Computing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101556960","display_name":"Feng Guo","orcid":"https://orcid.org/0000-0001-8131-9301"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng Guo","raw_affiliation_strings":["State Key Laboratory of Mathematical Engineering and Advanced Computing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Mathematical Engineering and Advanced Computing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051366939","display_name":"Zuoning Chen","orcid":"https://orcid.org/0000-0003-1975-5414"},"institutions":[{"id":"https://openalex.org/I40246663","display_name":"Chinese Academy of Engineering","ror":"https://ror.org/00z3yke57","country_code":"CN","type":"other","lineage":["https://openalex.org/I40246663"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuoning Chen","raw_affiliation_strings":["Chinese Academy of Engineering, China","Information Engineering University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Chinese Academy of Engineering, China","institution_ids":["https://openalex.org/I40246663"]},{"raw_affiliation_string":"Information Engineering University, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103161855"],"corresponding_institution_ids":["https://openalex.org/I40246663"],"apc_list":null,"apc_paid":null,"fwci":0.203,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.50666496,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9829999804496765,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/systolic-array","display_name":"Systolic array","score":0.8565400838851929},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7421626448631287},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7204573750495911},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6603454351425171},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.6387725472450256},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.541790246963501},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5372642278671265},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5199353098869324},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.36566925048828125},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30785036087036133},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.1402934193611145},{"id":"https://openalex.org/keywords/very-large-scale-integration","display_name":"Very-large-scale integration","score":0.09279900789260864}],"concepts":[{"id":"https://openalex.org/C150741067","wikidata":"https://www.wikidata.org/wiki/Q2377218","display_name":"Systolic array","level":3,"score":0.8565400838851929},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7421626448631287},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7204573750495911},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6603454351425171},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.6387725472450256},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.541790246963501},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5372642278671265},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5199353098869324},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.36566925048828125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30785036087036133},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.1402934193611145},{"id":"https://openalex.org/C14580979","wikidata":"https://www.wikidata.org/wiki/Q876049","display_name":"Very-large-scale integration","level":2,"score":0.09279900789260864},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3545008.3545086","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3545008.3545086","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 51st International Conference on Parallel Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1841592590","https://openalex.org/W1996901117","https://openalex.org/W2112796928","https://openalex.org/W2128853364","https://openalex.org/W2155893237","https://openalex.org/W2163605009","https://openalex.org/W2193145675","https://openalex.org/W2194775991","https://openalex.org/W2285660444","https://openalex.org/W2579241114","https://openalex.org/W2606722458","https://openalex.org/W2625457103","https://openalex.org/W2794952988","https://openalex.org/W2895394565","https://openalex.org/W2900228909","https://openalex.org/W2908078360","https://openalex.org/W2945146780","https://openalex.org/W2980186997","https://openalex.org/W3007021848","https://openalex.org/W3016542674","https://openalex.org/W3040024858","https://openalex.org/W3092640258","https://openalex.org/W3103168911","https://openalex.org/W3106250896","https://openalex.org/W3155922894","https://openalex.org/W3187908937","https://openalex.org/W6683738474","https://openalex.org/W6725543821"],"related_works":["https://openalex.org/W34241620","https://openalex.org/W1509211761","https://openalex.org/W2391299576","https://openalex.org/W2133693067","https://openalex.org/W1531488649","https://openalex.org/W1602905143","https://openalex.org/W3037767301","https://openalex.org/W1585350690","https://openalex.org/W2366027386","https://openalex.org/W2582456645"],"abstract_inverted_index":{"Ever-growing":[0],"CNN":[1],"size":[2],"incurs":[3],"a":[4,50],"significant":[5,64],"amount":[6],"of":[7,52,91,98],"redundancy":[8],"in":[9,13],"model":[10,27],"parameters,":[11],"which":[12],"turn,":[14],"puts":[15],"considerable":[16],"burden":[17],"on":[18,43],"hardware.":[19],"Unstructured":[20],"pruning":[21,35],"is":[22],"widely":[23],"used":[24],"to":[25,39],"reduce":[26],"sparsity.":[28],"While,":[29],"the":[30,58,96],"irregularity":[31],"introduced":[32],"by":[33],"unstructured":[34],"makes":[36],"it":[37,76],"difficult":[38],"accelerate":[40],"sparse":[41,60],"CNNs":[42],"systolic":[44,67,93],"array.":[45,68],"To":[46],"address":[47],"this":[48],"issue,":[49],"variety":[51],"accelerators":[53],"have":[54],"been":[55],"proposed.":[56],"SIGMA,":[57],"state-of-the-art":[59],"GEMM":[61],"accelerator,":[62],"achieves":[63],"speedup":[65],"over":[66],"However,":[69],"SIGMA":[70,88],"suffers":[71],"from":[72],"two":[73],"disadvantages:":[74],"1)":[75],"only":[77],"supports":[78],"one-side":[79],"sparsity,":[80],"leaving":[81],"potential":[82],"for":[83],"further":[84],"performance":[85],"gains;":[86],"2)":[87],"improves":[89],"utilization":[90],"large-sized":[92],"arrays":[94],"at":[95],"cost":[97],"extra":[99],"overhead.":[100]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-30T09:04:40.226872","created_date":"2025-10-10T00:00:00"}
