{"id":"https://openalex.org/W3187677606","doi":"https://doi.org/10.1109/tnnls.2022.3180209","title":"Spartus: A 9.4 TOp/s FPGA-Based LSTM Accelerator Exploiting Spatio-Temporal Sparsity","display_name":"Spartus: A 9.4 TOp/s FPGA-Based LSTM Accelerator Exploiting Spatio-Temporal Sparsity","publication_year":2022,"publication_date":"2022-06-10","ids":{"openalex":"https://openalex.org/W3187677606","doi":"https://doi.org/10.1109/tnnls.2022.3180209","mag":"3187677606","pmid":"https://pubmed.ncbi.nlm.nih.gov/35687629"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2022.3180209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3180209","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","datacite","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082967906","display_name":"Chang Gao","orcid":"https://orcid.org/0000-0002-3284-4078"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chang Gao","raw_affiliation_strings":["Sensors Group, Institute of Neuroinformatics, University of Z&#x00FC;rich and ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Sensors Group, Institute of Neuroinformatics, University of Z&#x00FC;rich and ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051651857","display_name":"Tobi Delbr\u00fcck","orcid":"https://orcid.org/0000-0001-5479-1141"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tobi Delbruck","raw_affiliation_strings":["Sensors Group, Institute of Neuroinformatics, University of Z&#x00FC;rich and ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Sensors Group, Institute of Neuroinformatics, University of Z&#x00FC;rich and ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053821067","display_name":"Shih\u2010Chii Liu","orcid":"https://orcid.org/0000-0002-7557-045X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shih-Chii Liu","raw_affiliation_strings":["Sensors Group, Institute of Neuroinformatics, University of Z&#x00FC;rich and ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Sensors Group, Institute of Neuroinformatics, University of Z&#x00FC;rich and ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5082967906"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":10.9736,"has_fulltext":false,"cited_by_count":46,"citation_normalized_percentile":{"value":0.99012745,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"35","issue":"1","first_page":"1098","last_page":"1112"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.8378286957740784},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7078378200531006},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.35357534885406494},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3498452603816986},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3223232626914978}],"concepts":[{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.8378286957740784},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7078378200531006},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.35357534885406494},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3498452603816986},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3223232626914978}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1109/tnnls.2022.3180209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3180209","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:35687629","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35687629","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null},{"id":"pmh:oai:www.zora.uzh.ch:217533","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401281","display_name":"Zurich Open Repository and Archive (University of Zurich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I202697423","host_organization_name":"University of Zurich","host_organization_lineage":["https://openalex.org/I202697423"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"Gao, Chao; Delbruck, Tobi; Liu, Shih-Chii  (2021). Spartus: A 9.4 TOp/s FPGA-based LSTM Accelerator Exploiting Spatio-temporal Sparsity.  ArXiv.org 2108.02297, Cornell University.","raw_type":"Working Paper"},{"id":"pmh:oai:arXiv.org:2108.02297","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.02297","pdf_url":"https://arxiv.org/pdf/2108.02297","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.5167/uzh-217533","is_oa":true,"landing_page_url":"https://doi.org/10.5167/uzh-217533","pdf_url":null,"source":{"id":"https://openalex.org/S7407051291","display_name":"Universit\u00e4t Z\u00fcrich, ZORA","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"},{"id":"doi:10.5167/uzh-231196","is_oa":true,"landing_page_url":"https://doi.org/10.5167/uzh-231196","pdf_url":null,"source":{"id":"https://openalex.org/S7407051291","display_name":"Universit\u00e4t Z\u00fcrich, ZORA","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:www.zora.uzh.ch:217533","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401281","display_name":"Zurich Open Repository and Archive (University of Zurich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I202697423","host_organization_name":"University of Zurich","host_organization_lineage":["https://openalex.org/I202697423"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"Gao, Chao; Delbruck, Tobi; Liu, Shih-Chii  (2021). Spartus: A 9.4 TOp/s FPGA-based LSTM Accelerator Exploiting Spatio-temporal Sparsity.  ArXiv.org 2108.02297, Cornell University.","raw_type":"Working Paper"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1395557198","display_name":null,"funder_award_id":"181010","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G1744075616","display_name":null,"funder_award_id":"185543","funder_id":"https://openalex.org/F4320326765","funder_display_name":"National Centre of Competence in Research Robotics"},{"id":"https://openalex.org/G3448440212","display_name":null,"funder_award_id":"185543","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G4186020712","display_name":null,"funder_award_id":"51NF40_185543","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4839563563","display_name":null,"funder_award_id":"BRIDGE","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G7192489655","display_name":null,"funder_award_id":"51NF40_185543","funder_id":"https://openalex.org/F4320326765","funder_display_name":"National Centre of Competence in Research Robotics"},{"id":"https://openalex.org/G7330217765","display_name":null,"funder_award_id":"51NF40_185543","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G7476027750","display_name":null,"funder_award_id":"51NF40","funder_id":"https://openalex.org/F4320326765","funder_display_name":"National Centre of Competence in Research Robotics"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320310967","display_name":"Universidad de Sevilla","ror":"https://ror.org/03yxnpp24"},{"id":"https://openalex.org/F4320315121","display_name":"Samsung Advanced Institute of Technology","ror":null},{"id":"https://openalex.org/F4320320924","display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","ror":"https://ror.org/00yjd3n13"},{"id":"https://openalex.org/F4320326765","display_name":"National Centre of Competence in Research Robotics","ror":null},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W179875071","https://openalex.org/W1494198834","https://openalex.org/W1596035946","https://openalex.org/W1635512741","https://openalex.org/W1999085092","https://openalex.org/W2002342963","https://openalex.org/W2064675550","https://openalex.org/W2095705004","https://openalex.org/W2127141656","https://openalex.org/W2143612262","https://openalex.org/W2147542748","https://openalex.org/W2157331557","https://openalex.org/W2193413348","https://openalex.org/W2293634267","https://openalex.org/W2582144945","https://openalex.org/W2585720638","https://openalex.org/W2623629680","https://openalex.org/W2730834423","https://openalex.org/W2761132374","https://openalex.org/W2788838111","https://openalex.org/W2904773682","https://openalex.org/W2915106038","https://openalex.org/W2940345045","https://openalex.org/W2943148367","https://openalex.org/W2962820060","https://openalex.org/W2962883174","https://openalex.org/W2963318827","https://openalex.org/W2964227577","https://openalex.org/W2964299589","https://openalex.org/W2982316857","https://openalex.org/W2997958396","https://openalex.org/W3005040076","https://openalex.org/W3009636589","https://openalex.org/W3027324516","https://openalex.org/W3108690123","https://openalex.org/W3127686677","https://openalex.org/W3190062760","https://openalex.org/W6631362777","https://openalex.org/W6674330103","https://openalex.org/W6687566353","https://openalex.org/W6732307519","https://openalex.org/W6734169003","https://openalex.org/W6744208968","https://openalex.org/W6748131973","https://openalex.org/W6751979845","https://openalex.org/W6773423997"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2111241003","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2096844293","https://openalex.org/W2363944576","https://openalex.org/W2351041855","https://openalex.org/W2570254841"],"abstract_inverted_index":{"Long":[0],"short-term":[1],"memory":[2,126],"(LSTM)":[3],"recurrent":[4],"networks":[5,74],"are":[6],"frequently":[7],"used":[8],"for":[9,68,153],"tasks":[10],"involving":[11],"time-sequential":[12],"data,":[13],"such":[14],"as":[15],"speech":[16,141],"recognition.":[17],"Unlike":[18],"previous":[19,109],"LSTM":[20,171],"accelerators":[21],"that":[22,40],"either":[23],"exploit":[24],"spatial":[25],"weight":[26,66,80,125],"sparsity":[27,43,50,81,103,118,167],"or":[28],"temporal":[29,102],"activation":[30],"sparsity,":[31],"this":[32],"article":[33],"proposes":[34],"a":[35,54,69,154],"new":[36,55],"accelerator":[37],"called":[38],"\"Spartus\"":[39],"exploits":[41],"spatio-temporal":[42,117,166],"to":[44,85,112,178,189],"achieve":[45,79,190],"ultralow":[46],"latency":[47,152],"inference.":[48],"Spatial":[49],"is":[51,135],"induced":[52],"using":[53,173],"column-balanced":[56],"targeted":[57],"dropout":[58],"(CBTD)":[59],"structured":[60,64],"pruning":[61],"method,":[62],"producing":[63],"sparse":[65],"matrices":[67],"balanced":[70],"workload.":[71],"The":[72,132],"pruned":[73],"running":[75],"on":[76,93,124,145,168],"Spartus":[77,133,150,183],"hardware":[78,187],"levels":[82],"of":[83,158,182],"up":[84],"96%":[86],"and":[87,96,121,128,137,147,195],"94%":[88],"with":[89,119],"negligible":[90],"accuracy":[91],"loss":[92],"the":[94,97,108,113,174],"TIMIT":[95,175],"Librispeech":[98],"datasets.":[99],"To":[100],"induce":[101],"in":[104],"LSTM,":[105],"we":[106],"extend":[107],"DeltaGRU":[110],"method":[111],"DeltaLSTM":[114,122,156],"method.":[115],"Combining":[116],"CBTD":[120],"saves":[123],"access":[127],"associated":[129],"arithmetic":[130],"operations.":[131],"architecture":[134],"scalable":[136],"supports":[138],"real-time":[139],"online":[140],"recognition":[142],"when":[143],"implemented":[144],"small":[146],"large":[148],"FPGAs.":[149],"per-sample":[151],"single":[155],"layer":[157],"1024":[159],"neurons":[160],"averages":[161],"1":[162],"\u03bc":[163],"s.":[164],"Exploiting":[165],"our":[169],"test":[170],"network":[172],"dataset":[176],"leads":[177],"46":[179],"\u00d7":[180],"speedup":[181],"over":[184],"its":[185],"theoretical":[186],"performance":[188],"9.4-TOp/s":[191],"effective":[192],"batch-1":[193],"throughput":[194],"1.1-TOp/s/W":[196],"power":[197],"efficiency.":[198]},"counts_by_year":[{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":9}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
