{"id":"https://openalex.org/W2963300701","doi":"https://doi.org/10.1109/tvlsi.2019.2927375","title":"A 3.89-GOPS/mW Scalable Recurrent Neural Network Processor With Improved Efficiency on Memory and Computation","display_name":"A 3.89-GOPS/mW Scalable Recurrent Neural Network Processor With Improved Efficiency on Memory and Computation","publication_year":2019,"publication_date":"2019-07-24","ids":{"openalex":"https://openalex.org/W2963300701","doi":"https://doi.org/10.1109/tvlsi.2019.2927375","mag":"2963300701"},"language":"en","primary_location":{"id":"doi:10.1109/tvlsi.2019.2927375","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2019.2927375","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063249831","display_name":"Jiaquan Wu","orcid":"https://orcid.org/0000-0002-1155-1321"},"institutions":[{"id":"https://openalex.org/I4210092088","display_name":"Zhejiang Province Institute of Architectural Design and Research","ror":"https://ror.org/00f89ms08","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210092088"]},{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiaquan Wu","raw_affiliation_strings":["Institute of VLSI Design, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-1155-1321","affiliations":[{"raw_affiliation_string":"Institute of VLSI Design, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4210092088","https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090231471","display_name":"Feiteng Li","orcid":"https://orcid.org/0000-0003-3032-9782"},"institutions":[{"id":"https://openalex.org/I4210092088","display_name":"Zhejiang Province Institute of Architectural Design and Research","ror":"https://ror.org/00f89ms08","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210092088"]},{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feiteng Li","raw_affiliation_strings":["Institute of VLSI Design, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-3032-9782","affiliations":[{"raw_affiliation_string":"Institute of VLSI Design, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4210092088","https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100716616","display_name":"Zhijian Chen","orcid":"https://orcid.org/0000-0002-5844-0135"},"institutions":[{"id":"https://openalex.org/I4210092088","display_name":"Zhejiang Province Institute of Architectural Design and Research","ror":"https://ror.org/00f89ms08","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210092088"]},{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhijian Chen","raw_affiliation_strings":["Institute of VLSI Design, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-5844-0135","affiliations":[{"raw_affiliation_string":"Institute of VLSI Design, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I4210092088","https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046536624","display_name":"Xiaoyan Xiang","orcid":"https://orcid.org/0000-0002-5602-2749"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyan Xiang","raw_affiliation_strings":["State Key Laboratory of ASIC and System, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-5602-2749","affiliations":[{"raw_affiliation_string":"State Key Laboratory of ASIC and System, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5063249831"],"corresponding_institution_ids":["https://openalex.org/I4210092088","https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.919,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.79197932,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"27","issue":"12","first_page":"2939","last_page":"2943"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8051935434341431},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.7949104905128479},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7318623661994934},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.649830162525177},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5654522180557251},{"id":"https://openalex.org/keywords/network-topology","display_name":"Network topology","score":0.4894336760044098},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4869135618209839},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.40105608105659485},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3873399496078491},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3547118008136749},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2008647322654724},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.1457560956478119},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13351571559906006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8051935434341431},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.7949104905128479},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7318623661994934},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.649830162525177},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5654522180557251},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.4894336760044098},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4869135618209839},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.40105608105659485},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3873399496078491},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3547118008136749},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2008647322654724},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.1457560956478119},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13351571559906006},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tvlsi.2019.2927375","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2019.2927375","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8999999761581421,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G8167686772","display_name":null,"funder_award_id":"61801425","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1496120315","https://openalex.org/W1591801644","https://openalex.org/W1689711448","https://openalex.org/W2064675550","https://openalex.org/W2069562172","https://openalex.org/W2119144962","https://openalex.org/W2143612262","https://openalex.org/W2157331557","https://openalex.org/W2284628133","https://openalex.org/W2285660444","https://openalex.org/W2289615953","https://openalex.org/W2625468380","https://openalex.org/W2730834423","https://openalex.org/W2757698722","https://openalex.org/W2914294010","https://openalex.org/W2963820107","https://openalex.org/W2964299589","https://openalex.org/W3026054707","https://openalex.org/W6635446068","https://openalex.org/W6677580257","https://openalex.org/W6695553435","https://openalex.org/W6696711501"],"related_works":["https://openalex.org/W4298287631","https://openalex.org/W2953061907","https://openalex.org/W1847088711","https://openalex.org/W4225394202","https://openalex.org/W3036642985","https://openalex.org/W3032952384","https://openalex.org/W2964335273","https://openalex.org/W2982145560","https://openalex.org/W2969450769","https://openalex.org/W2326447594"],"abstract_inverted_index":{"Recurrent":[0],"neural":[1],"networks":[2],"(RNNs)":[3],"perform":[4],"excellently":[5],"on":[6,37,159],"sequencing":[7],"tasks":[8],"but":[9],"are":[10],"severely":[11],"restricted":[12],"by":[13,49],"the":[14,51,67,77,123,126,132,137,160,193],"complex":[15],"computations":[16],"and":[17,80,93,171,179],"intensive":[18],"memory":[19,156],"consumption":[20],"due":[21],"to":[22,34,113],"their":[23],"internal":[24],"fully":[25],"connected":[26],"topologies,":[27],"thereby":[28],"making":[29],"it":[30],"a":[31,119,141,165],"great":[32],"challenge":[33],"implement":[35],"RNNs":[36],"embedded":[38],"devices.":[39],"In":[40],"this":[41,162],"brief,":[42],"we":[43],"propose":[44],"an":[45,58],"energy-efficient":[46],"RNN":[47,101,197],"processor":[48,116,139,163],"exploiting":[50],"data":[52],"locality":[53],"in":[54,87,118,131],"network":[55,127],"compression":[56],"using":[57],"innovative":[59],"quantified":[60],"sparse":[61],"matrix":[62],"encoding":[63],"format.":[64],"Compared":[65],"with":[66,122,150,175],"conventional":[68],"processors":[69],"for":[70],"compressed":[71],"RNNs,":[72],"more":[73],"than":[74],"80%":[75],"of":[76,100,125,144,153,168,192],"weight":[78],"fetching":[79],"matrix-vector":[81],"multiplications":[82],"can":[83],"be":[84],"further":[85],"reduced":[86],"applications,":[88],"such":[89],"as":[90],"natural":[91],"language":[92],"keyword":[94],"spotting.":[95],"To":[96],"handle":[97],"different":[98],"scales":[99],"models":[102],"without":[103],"introducing":[104],"significant":[105],"interactive":[106],"overhead,":[107],"scalable":[108],"hardware":[109],"architecture":[110],"is":[111,190],"presented":[112],"organize":[114],"multiple":[115],"engines":[117],"spatial":[120],"fashion":[121],"assistance":[124],"cross-division":[128],"strategy.":[129],"Synthesized":[130],"SMIC":[133],"40LL":[134],"CMOS":[135],"process,":[136],"prototype":[138],"has":[140],"total":[142],"area":[143],"0.65":[145],"mm":[146],"<sup":[147],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[148],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[149],"95.5":[151],"kB":[152],"static":[154],"random-access":[155],"capacity.":[157],"Based":[158],"simulation,":[161],"achieves":[164],"peak":[166,183],"performance":[167],"24":[169],"GOPS":[170],"dissipates":[172],"6.16-mW":[173],"power":[174],"1.1":[176],"V":[177],"supply":[178],"200":[180],"MHz.":[181],"The":[182],"energy":[184],"efficiency":[185],"reaches":[186],"3.89":[187],"GOPS/mW,":[188],"which":[189],"state":[191],"art":[194],"among":[195],"existing":[196],"accelerators.":[198]},"counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
