{"id":"https://openalex.org/W4285250061","doi":"https://doi.org/10.1109/tcsi.2022.3178474","title":"A High Performance Multi-Bit-Width Booth Vector Systolic Accelerator for NAS Optimized Deep Learning Neural Networks","display_name":"A High Performance Multi-Bit-Width Booth Vector Systolic Accelerator for NAS Optimized Deep Learning Neural Networks","publication_year":2022,"publication_date":"2022-06-10","ids":{"openalex":"https://openalex.org/W4285250061","doi":"https://doi.org/10.1109/tcsi.2022.3178474"},"language":"en","primary_location":{"id":"doi:10.1109/tcsi.2022.3178474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2022.3178474","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038495391","display_name":"Mingqiang Huang","orcid":"https://orcid.org/0000-0002-7794-3985"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mingqiang Huang","raw_affiliation_strings":["Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China","School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-7794-3985","affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088097198","display_name":"Yucen Liu","orcid":"https://orcid.org/0000-0002-1174-5337"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yucen Liu","raw_affiliation_strings":["School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-1174-5337","affiliations":[{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056167336","display_name":"Changhai Man","orcid":"https://orcid.org/0000-0003-0693-3904"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changhai Man","raw_affiliation_strings":["School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-0693-3904","affiliations":[{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090865912","display_name":"Kai Li","orcid":"https://orcid.org/0000-0003-3251-931X"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Li","raw_affiliation_strings":["School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-3251-931X","affiliations":[{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046207386","display_name":"Quan Cheng","orcid":"https://orcid.org/0000-0001-5519-3258"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]},{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN","JP"],"is_corresponding":false,"raw_author_name":"Quan Cheng","raw_affiliation_strings":["Department of Communications and Computer Engineering, Kyoto University, Kyoto, Japan","School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-5519-3258","affiliations":[{"raw_affiliation_string":"Department of Communications and Computer Engineering, Kyoto University, Kyoto, Japan","institution_ids":["https://openalex.org/I22299242"]},{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062269789","display_name":"Wei Mao","orcid":"https://orcid.org/0000-0003-2527-6778"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Mao","raw_affiliation_strings":["School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-2527-6778","affiliations":[{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034853402","display_name":"Hao Yu","orcid":"https://orcid.org/0000-0002-2674-4118"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Yu","raw_affiliation_strings":["School of Microelectronics, Southern University of Science and Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-2674-4118","affiliations":[{"raw_affiliation_string":"School of Microelectronics, Southern University of Science and Technology, Shenzhen, China","institution_ids":["https://openalex.org/I3045169105"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5038495391"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I3045169105","https://openalex.org/I4210145761"],"apc_list":null,"apc_paid":null,"fwci":4.5714,"has_fulltext":false,"cited_by_count":48,"citation_normalized_percentile":{"value":0.95944663,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"69","issue":"9","first_page":"3619","last_page":"3631"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7576700448989868},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6993374228477478},{"id":"https://openalex.org/keywords/systolic-array","display_name":"Systolic array","score":0.6507202386856079},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5904157757759094},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.5411630272865295},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.5281184911727905},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5133211016654968},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.458008736371994},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.454303115606308},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.4182111918926239},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3748818635940552},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3623508810997009},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2838315963745117},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.26955652236938477},{"id":"https://openalex.org/keywords/very-large-scale-integration","display_name":"Very-large-scale integration","score":0.16133400797843933}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7576700448989868},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6993374228477478},{"id":"https://openalex.org/C150741067","wikidata":"https://www.wikidata.org/wiki/Q2377218","display_name":"Systolic array","level":3,"score":0.6507202386856079},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5904157757759094},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.5411630272865295},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.5281184911727905},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5133211016654968},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.458008736371994},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.454303115606308},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4182111918926239},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3748818635940552},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3623508810997009},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2838315963745117},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.26955652236938477},{"id":"https://openalex.org/C14580979","wikidata":"https://www.wikidata.org/wiki/Q876049","display_name":"Very-large-scale integration","level":2,"score":0.16133400797843933}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsi.2022.3178474","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2022.3178474","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.6499999761581421}],"awards":[{"id":"https://openalex.org/G1490070647","display_name":null,"funder_award_id":"2018KCXTD028","funder_id":"https://openalex.org/F4320326279","funder_display_name":"Department of Education of Guangdong Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320326279","display_name":"Department of Education of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W2017369466","https://openalex.org/W2048266589","https://openalex.org/W2094756095","https://openalex.org/W2117539524","https://openalex.org/W2119293553","https://openalex.org/W2160815625","https://openalex.org/W2395611524","https://openalex.org/W2475840367","https://openalex.org/W2584311934","https://openalex.org/W2585560244","https://openalex.org/W2593564159","https://openalex.org/W2594492285","https://openalex.org/W2606722458","https://openalex.org/W2885527679","https://openalex.org/W2900228909","https://openalex.org/W2903260438","https://openalex.org/W2936278485","https://openalex.org/W2946355854","https://openalex.org/W2946572707","https://openalex.org/W2949619037","https://openalex.org/W2962860921","https://openalex.org/W2963367920","https://openalex.org/W2963526839","https://openalex.org/W2964259004","https://openalex.org/W2964504576","https://openalex.org/W2967733054","https://openalex.org/W2997958863","https://openalex.org/W2999241864","https://openalex.org/W3003453708","https://openalex.org/W3008072732","https://openalex.org/W3008515144","https://openalex.org/W3038838661","https://openalex.org/W3096533519","https://openalex.org/W3100543277","https://openalex.org/W3113827151","https://openalex.org/W3114917619","https://openalex.org/W3116917247","https://openalex.org/W3118404249","https://openalex.org/W3131458535","https://openalex.org/W4240639369","https://openalex.org/W6637373629","https://openalex.org/W6756887525","https://openalex.org/W6756979132"],"related_works":["https://openalex.org/W2999668243","https://openalex.org/W2347854075","https://openalex.org/W2132614232","https://openalex.org/W2518118925","https://openalex.org/W3159273459","https://openalex.org/W4283703276","https://openalex.org/W4319952061","https://openalex.org/W4280636456","https://openalex.org/W4388913998","https://openalex.org/W4310584535"],"abstract_inverted_index":{"Multi-bit-width":[0],"convolutional":[1,150],"neural":[2,38],"network":[3,9,45,66,141],"(CNN)":[4],"maintains":[5],"the":[6,43,62,90,98,111,136,149,174],"balance":[7],"between":[8],"accuracy":[10,64],"and":[11,101,145,165],"hardware":[12],"efficiency,":[13],"thus":[14],"enlightening":[15],"a":[16],"promising":[17],"method":[18,58],"for":[19,33,61,78,87,159,163,168],"accurate":[20],"yet":[21],"energy-efficient":[22],"edge":[23],"computing.":[24],"In":[25],"this":[26],"work,":[27],"we":[28],"develop":[29],"state-of-the-art":[30],"multi-bit-width":[31,44,65,72,118],"accelerator":[32,180],"NAS":[34,138],"Optimized":[35],"deep":[36],"learning":[37],"networks.":[39],"To":[40],"efficiently":[41],"process":[42],"inferencing,":[46],"multi-level":[47],"optimizations":[48],"have":[49],"been":[50,123],"proposed.":[51],"Firstly,":[52],"differential":[53],"Neural":[54],"Architecture":[55],"Search":[56],"(NAS)":[57],"is":[59,76,85,142,172],"adopted":[60],"high":[63,155],"generation.":[67],"Secondly,":[68],"hybrid":[69],"Booth":[70],"based":[71],"multiply-add-accumulation":[73],"(MAC)":[74],"unit":[75],"developed":[77],"data":[79],"processing.":[80],"Thirdly,":[81],"vector":[82],"systolic":[83,95,113],"array":[84],"proposed":[86,117],"effectively":[88],"accelerating":[89,135],"matrix":[91],"multiplications.":[92],"With":[93],"vector-style":[94],"dataflow,":[96],"both":[97],"processing":[99],"time":[100],"logic":[102],"resources":[103],"consumption":[104],"can":[105,152],"be":[106],"reduced":[107],"when":[108],"compared":[109],"with":[110],"classical":[112],"array.":[114],"Finally,":[115],"The":[116],"CNN":[119,179],"acceleration":[120],"scheme":[121],"has":[122],"practically":[124],"deployed":[125],"on":[126,134],"FPGA":[127],"platform":[128],"of":[129,148],"Xilinx":[130],"ZCU102.":[131],"Average":[132],"performance":[133,147],"full":[137],"optimized":[139],"VGG16":[140],"784.2":[143],"GOPS,":[144],"peek":[146],"layer":[151],"reach":[153],"as":[154,156],"871.26":[157],"GOPS":[158,162,167],"INT8,":[160],"1676.96":[161],"INT4,":[164],"2863.29":[166],"INT2":[169],"respectively,":[170],"which":[171],"among":[173],"best":[175],"results":[176],"in":[177],"previous":[178],"benchmarks.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":21},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":2}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
