{"id":"https://openalex.org/W3015688608","doi":"https://doi.org/10.1109/icassp40776.2020.9053228","title":"A Fifo Based Accelerator for Convolutional Neural Networks","display_name":"A Fifo Based Accelerator for Convolutional Neural Networks","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3015688608","doi":"https://doi.org/10.1109/icassp40776.2020.9053228","mag":"3015688608"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9053228","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053228","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061853701","display_name":"Vineet Panchbhaiyye","orcid":null},"institutions":[{"id":"https://openalex.org/I16269868","display_name":"Santa Clara University","ror":"https://ror.org/03ypqe447","country_code":"US","type":"education","lineage":["https://openalex.org/I16269868"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Vineet Panchbhaiyye","raw_affiliation_strings":["Department of Electrical Engineering, Santa Clara University, Santa Clara, CA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Santa Clara University, Santa Clara, CA","institution_ids":["https://openalex.org/I16269868"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025538938","display_name":"Tokunbo Ogunfunmi","orcid":"https://orcid.org/0000-0003-3517-9779"},"institutions":[{"id":"https://openalex.org/I16269868","display_name":"Santa Clara University","ror":"https://ror.org/03ypqe447","country_code":"US","type":"education","lineage":["https://openalex.org/I16269868"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tokunbo Ogunfunmi","raw_affiliation_strings":["Department of Electrical Engineering, Santa Clara University, Santa Clara, CA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Santa Clara University, Santa Clara, CA","institution_ids":["https://openalex.org/I16269868"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5061853701"],"corresponding_institution_ids":["https://openalex.org/I16269868"],"apc_list":null,"apc_paid":null,"fwci":0.3908,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.60296095,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1758","last_page":"1762"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8525546789169312},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6526829600334167},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5046459436416626},{"id":"https://openalex.org/keywords/application-specific-integrated-circuit","display_name":"Application-specific integrated circuit","score":0.503278911113739},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4630546569824219},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4550120234489441},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.44538065791130066},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.43718841671943665},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.4247824549674988},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.4197429418563843},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4018205404281616},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.39269137382507324},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3843449354171753},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3449889123439789},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3104170858860016}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8525546789169312},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6526829600334167},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5046459436416626},{"id":"https://openalex.org/C77390884","wikidata":"https://www.wikidata.org/wiki/Q217302","display_name":"Application-specific integrated circuit","level":2,"score":0.503278911113739},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4630546569824219},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4550120234489441},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.44538065791130066},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.43718841671943665},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.4247824549674988},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.4197429418563843},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4018205404281616},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.39269137382507324},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3843449354171753},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3449889123439789},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3104170858860016},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9053228","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053228","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.8199999928474426}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1665214252","https://openalex.org/W1686810756","https://openalex.org/W1832693441","https://openalex.org/W2289252105","https://openalex.org/W2553762784","https://openalex.org/W2591982329","https://openalex.org/W2604319603","https://openalex.org/W2766143712","https://openalex.org/W2798992029","https://openalex.org/W2919115771","https://openalex.org/W2962835968","https://openalex.org/W6637373629","https://openalex.org/W6745730985"],"related_works":["https://openalex.org/W2165367082","https://openalex.org/W1972641423","https://openalex.org/W611446063","https://openalex.org/W1996322406","https://openalex.org/W4206938017","https://openalex.org/W1967064512","https://openalex.org/W2388299947","https://openalex.org/W2382673458","https://openalex.org/W2361380273","https://openalex.org/W782612275"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"Deep":[3],"Neural":[4,29],"Networks":[5,30],"(DNNs)":[6],"have":[7,32,94],"achieved":[8],"state-of-the-art":[9],"results":[10,121,137],"in":[11,36,163],"various":[12],"fields":[13],"like":[14,38],"Computer":[15],"Vision,":[16],"Natural":[17],"Language":[18],"Processing":[19,59],"and":[20,41,68,72,91,105],"Speech":[21],"Recognition.":[22],"Of":[23],"all":[24],"the":[25,48,52,95,136,141,160,164,177],"DNN":[26],"architectures,":[27],"Convolutional":[28],"(CNNs)":[31],"been":[33],"most":[34],"effective":[35],"tasks":[37],"image":[39],"classification":[40],"object":[42],"detection.":[43],"The":[44,155],"high":[45],"performance":[46],"of":[47,54,138,140,176],"CNNs":[49,99],"comes":[50],"at":[51,153],"cost":[53],"computational":[55],"complexity.":[56],"Currently":[57],"Graphics":[58],"Units":[60],"(GPUs)":[61],"are":[62,78,86,101,132],"used":[63],"to":[64,97,118,127,134,158],"accelerate":[65],"CNN":[66],"training":[67],"inference":[69],"on":[70,146],"workstations":[71],"data":[73],"servers.":[74],"Though":[75],"popular,":[76],"GPUs":[77],"not":[79,87],"suitable":[80],"for":[81,103,171],"embedded":[82],"applications":[83],"because":[84],"they":[85],"energy":[88,104],"efficient.":[89],"ASIC":[90],"FPGA":[92],"accelerators":[93],"potential":[96],"run":[98,159],"that":[100],"optimized":[102],"performance.In":[106],"this":[107],"paper":[108],"we":[109],"present":[110],"an":[111,147],"architecture":[112,173],"which":[113],"takes":[114],"a":[115],"novel":[116],"approach":[117],"compute":[119],"convolution":[120,161],"using":[122],"row-wise":[123],"inputs":[124],"as":[125],"opposed":[126],"traditional":[128],"tile-based":[129],"processing.":[130],"We":[131],"able":[133],"exceed":[135],"state":[139,175],"art":[142,178],"architectures":[143],"when":[144],"implemented":[145],"inexpensive":[148],"PYNQ":[149],"Z1":[150],"board":[151],"running":[152],"100Mhz.":[154],"total":[156],"latency":[157],"layers":[162],"VGG16":[165],"benchmark":[166],"is":[167],"nearly":[168],"1.5x":[169],"lower":[170],"our":[172],"than":[174],"architectures.":[179]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
