{"id":"https://openalex.org/W2781078435","doi":"https://doi.org/10.1109/globalsip.2017.8309067","title":"A 200MHZ 202.4GFLOPS@10.8W VGG16 accelerator in Xilinx VX690T","display_name":"A 200MHZ 202.4GFLOPS@10.8W VGG16 accelerator in Xilinx VX690T","publication_year":2017,"publication_date":"2017-11-01","ids":{"openalex":"https://openalex.org/W2781078435","doi":"https://doi.org/10.1109/globalsip.2017.8309067","mag":"2781078435"},"language":"en","primary_location":{"id":"doi:10.1109/globalsip.2017.8309067","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globalsip.2017.8309067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Global Conference on Signal and Information Processing (GlobalSIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067104418","display_name":"Chunsheng Mei","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chunsheng Mei","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi'an, 710072, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi'an, 710072, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100405183","display_name":"Zhenyu Liu","orcid":"https://orcid.org/0000-0003-0251-3267"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhenyu Liu","raw_affiliation_strings":["RIIT&TNList"],"affiliations":[{"raw_affiliation_string":"RIIT&TNList","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101472380","display_name":"Yue Niu","orcid":"https://orcid.org/0000-0002-1663-2921"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Niu","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi'an, 710072, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi'an, 710072, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024401174","display_name":"Xiangyang Ji","orcid":"https://orcid.org/0000-0002-7333-9975"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangyang Ji","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, 100084, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, 100084, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000288828","display_name":"Wei Zhou","orcid":"https://orcid.org/0000-0001-9715-6957"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhou","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi'an, 710072, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi'an, 710072, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100450580","display_name":"Dongsheng Wang","orcid":"https://orcid.org/0000-0001-7676-7767"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dongsheng Wang","raw_affiliation_strings":["RIIT&TNList"],"affiliations":[{"raw_affiliation_string":"RIIT&TNList","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5067104418"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":1.0183,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.79175804,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"784","last_page":"788"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8110858201980591},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6964331269264221},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.6173011064529419},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6048161387443542},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.5739344954490662},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5116753578186035},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.4938724637031555},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.47279638051986694},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4076053500175476},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3911231458187103},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3272511959075928},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2722584307193756},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.0825147032737732}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8110858201980591},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6964331269264221},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.6173011064529419},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6048161387443542},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.5739344954490662},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5116753578186035},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.4938724637031555},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.47279638051986694},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4076053500175476},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3911231458187103},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3272511959075928},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2722584307193756},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0825147032737732},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/globalsip.2017.8309067","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globalsip.2017.8309067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Global Conference on Signal and Information Processing (GlobalSIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.41999998688697815,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1902041153","https://openalex.org/W1996901117","https://openalex.org/W2067523571","https://openalex.org/W2094756095","https://openalex.org/W2113724275","https://openalex.org/W2119144962","https://openalex.org/W2167215970","https://openalex.org/W2276486856","https://openalex.org/W2289252105","https://openalex.org/W2295680811","https://openalex.org/W2300242332","https://openalex.org/W2518546937","https://openalex.org/W2562773490","https://openalex.org/W2610691757","https://openalex.org/W2950248853","https://openalex.org/W2950967261","https://openalex.org/W2963056148","https://openalex.org/W2964299589","https://openalex.org/W4240168186","https://openalex.org/W4242577057"],"related_works":["https://openalex.org/W4315697128","https://openalex.org/W3102845713","https://openalex.org/W2971502891","https://openalex.org/W3205506801","https://openalex.org/W4280599700","https://openalex.org/W3183570023","https://openalex.org/W4382323155","https://openalex.org/W2016508734","https://openalex.org/W4287067436","https://openalex.org/W2986126107"],"abstract_inverted_index":{"Convolutional":[0],"Neural":[1],"Networks":[2],"(CNN)":[3],"are":[4],"among":[5],"the":[6,29,52,59,81,123],"most":[7],"powerful":[8],"and":[9,20,34,42,57,75,98,133],"widely":[10],"used":[11],"algorithms":[12],"for":[13],"computer":[14],"vision":[15],"applications,":[16],"notwithstanding":[17],"their":[18],"computation-demanding":[19],"memory-intensive":[21],"operations.":[22],"The":[23,66],"cumbersome":[24],"CNN":[25,109],"operation":[26],"stems":[27],"from":[28],"bulky":[30],"cross":[31],"channel":[32],"computation":[33],"massive":[35],"parameter":[36],"retrieving":[37],"of":[38,72,77],"convolutional":[39],"(CONV)":[40],"layers":[41,79],"fully-connected":[43,64,78],"(FC)":[44],"layers,":[45],"respectively.":[46],"In":[47,84],"this":[48],"paper,":[49],"to":[50],"remove":[51],"inter-filter":[53],"redundancy,":[54],"we":[55,104],"constructed":[56],"tuned":[58],"specific":[60],"low-rank":[61],"filters":[62],"in":[63,80],"layers.":[65],"proposed":[67],"rank":[68],"reduction":[69],"saves":[70],"88.9%":[71],"both":[73],"arithmetic":[74],"parameters":[76],"VGG16":[82],"model.":[83],"addition,":[85],"by":[86],"employing":[87],"network-layer-wise":[88],"ping-pong":[89],"DDR":[90],"access":[91],"mode,":[92],"tile-grain":[93],"on-chip":[94],"feature":[95],"map":[96],"buffers,":[97],"Propagate":[99],"Partial":[100],"Multiply-Accumulate":[101],"(PPMAC)":[102],"processor,":[103],"implemented":[105],"a":[106],"202.4":[107],"GFLOPS":[108],"accelerator":[110,124],"with":[111,129],"half-precision":[112],"data":[113],"format":[114],"on":[115],"Xilinx":[116],"VC709":[117],"evaluation":[118],"board.":[119],"Experiments":[120],"show":[121],"that":[122],"achieved":[125],"6.58":[126],"fps":[127],"throughput":[128],"0.7046":[130],"top-1":[131],"accuracy":[132,136],"0.8977":[134],"top-5":[135],"under":[137],"200MHz":[138],"working":[139],"frequency.":[140]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2026-03-10T14:07:55.174380","created_date":"2025-10-10T00:00:00"}
