{"id":"https://openalex.org/W4410552911","doi":"https://doi.org/10.23919/date64628.2025.10993198","title":"A Low-Power Mixed-Precision Integrated Multiply-Accumulate Architecture for Quantized Deep Neural Networks","display_name":"A Low-Power Mixed-Precision Integrated Multiply-Accumulate Architecture for Quantized Deep Neural Networks","publication_year":2025,"publication_date":"2025-03-31","ids":{"openalex":"https://openalex.org/W4410552911","doi":"https://doi.org/10.23919/date64628.2025.10993198"},"language":"en","primary_location":{"id":"doi:10.23919/date64628.2025.10993198","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10993198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113581365","display_name":"Xiaolu Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaolu Hu","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059647894","display_name":"Xinkuang Geng","orcid":"https://orcid.org/0000-0003-3673-237X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinkuang Geng","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103236320","display_name":"Zhigang Mao","orcid":"https://orcid.org/0000-0001-9431-9853"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhigang Mao","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005550142","display_name":"Jie Han","orcid":"https://orcid.org/0000-0002-8849-4994"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jie Han","raw_affiliation_strings":["University of Alberta,Department of Electrical and Computer Engineering,Edmonton,Canada"],"affiliations":[{"raw_affiliation_string":"University of Alberta,Department of Electrical and Computer Engineering,Edmonton,Canada","institution_ids":["https://openalex.org/I154425047"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019717600","display_name":"Honglan Jiang","orcid":"https://orcid.org/0000-0003-3705-4240"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Honglan Jiang","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Micro-Nano Electronics,Shanghai,China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5113581365"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":2.8414,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.90851723,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9135000109672546,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9135000109672546,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.6450945734977722},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5950137376785278},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5758363008499146},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.5414770245552063},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4939120411872864},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4193372130393982},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3526540696620941},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09834599494934082}],"concepts":[{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.6450945734977722},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5950137376785278},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5758363008499146},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.5414770245552063},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4939120411872864},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4193372130393982},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3526540696620941},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09834599494934082},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/date64628.2025.10993198","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date64628.2025.10993198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Design, Automation &amp;amp; Test in Europe Conference (DATE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.4000000059604645,"display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G5187170828","display_name":null,"funder_award_id":"RES0048688,RES0051374,RES0054326","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"},{"id":"https://openalex.org/G6329299072","display_name":null,"funder_award_id":"2022YFB4500200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2593564159","https://openalex.org/W2895531329","https://openalex.org/W2952857977","https://openalex.org/W2963367920","https://openalex.org/W2964504576","https://openalex.org/W2965976751","https://openalex.org/W2987956272","https://openalex.org/W3217237164","https://openalex.org/W4206957512","https://openalex.org/W4285257701","https://openalex.org/W4312910656","https://openalex.org/W4386076113","https://openalex.org/W4390833969","https://openalex.org/W4399487325","https://openalex.org/W4400811359","https://openalex.org/W4401568667","https://openalex.org/W4401568751","https://openalex.org/W6760069825","https://openalex.org/W6790078748","https://openalex.org/W6847478871"],"related_works":["https://openalex.org/W2588198209","https://openalex.org/W1909006023","https://openalex.org/W4205824991","https://openalex.org/W3200723557","https://openalex.org/W4312713546","https://openalex.org/W2362195430","https://openalex.org/W2347494122","https://openalex.org/W2567983276","https://openalex.org/W2802298219","https://openalex.org/W2038503502"],"abstract_inverted_index":{"As":[0],"mixed-precision":[1,20,32,65,72,196],"quantization":[2],"techniques":[3],"have":[4],"been":[5,59],"widely":[6],"considered":[7,60],"for":[8,164,189,207,279,294],"balancing":[9],"computational":[10],"efficiency":[11,51,253,257,278],"and":[12,97,109,162,167,254,262,285],"flexibility":[13],"in":[14,27,61,142,214,258],"quantized":[15],"deep":[16],"neural":[17],"networks":[18],"(DNNs),":[19],"multiply-accumulate":[21],"(MAC)":[22],"units":[23],"are":[24,231],"increasingly":[25],"important":[26],"DNN":[28],"accelerators.":[29],"However,":[30],"conventional":[31],"MAC":[33,73,151,197,216,236],"architectures":[34],"support":[35],"either":[36],"signed":[37,39,45],"\u00d7":[38,80,83,87,91,95,100],"or":[40],"unsigned":[41],"\u00d7unsigned":[42,46],"multiplications.":[43],"The":[44,125],"multiplication":[47,115,136,209],"enhancing":[48],"the":[49,62,107,114,130,135,149,156,173,177,234,250,268,276],"computing":[50,205],"of":[52,64,111,134],"DNNs":[53,240],"with":[54,172,267,271],"ReLU":[55],"activations":[56],"has":[57],"never":[58],"design":[63,174],"MAC.":[66],"Thus,":[67],"this":[68,103],"work":[69],"proposes":[70],"a":[71,215,243],"architecture":[74],"supporting":[75],"six":[76],"operation":[77,220,264,296],"modes,":[78,113,221],"int8":[79,82],"int8,":[81],"uint8,":[84],"two":[85,89],"int4":[86,90],"int4,":[88],"uint4,":[92],"four":[93,98,120],"int2":[94,99],"int2,":[96],"uint2.":[101],"In":[102],"design,":[104],"to":[105,137,193,223,238],"balance":[106],"power":[108,157,187],"delay":[110],"different":[112],"is":[116,127,210],"implemented":[117],"based":[118,175],"on":[119,176],"precision-split":[121],"4\u00d74":[122],"multipliers":[123],"(PS4Ms).":[124],"accumulation":[126,133],"integrated":[128],"into":[129],"partial":[131],"product":[132],"eliminate":[138],"redundant":[139],"switching":[140],"activities":[141],"separate":[143],"compression.":[144],"With":[145],"10%":[146],"area":[147,256],"reduction,":[148],"proposed":[150],"denoted":[152],"as":[153,224],"PS4MAC,":[154],"reduces":[155],"by":[158,282],"over":[159,185],"35%,":[160],"42%,":[161],"56%":[163],"8-bit,":[165,260],"4-bit,":[166,261],"2-bit":[168,263],"operations,":[169],"respectively,":[170],"compared":[171,192],"Synopsys":[178],"DesignWare":[179],"(DW)":[180],"multipliers.":[181],"Additionally,":[182],"it":[183],"achieves":[184,287],"23%":[186],"savings":[188],"8-bit":[190,208,280],"operations":[191,281],"state-of-the-art":[194],"(SotA)":[195],"designs.":[198],"To":[199],"save":[200],"more":[201],"power,":[202],"an":[203],"approximate":[204],"mode":[206],"further":[211],"designed,":[212],"resulting":[213],"unit":[217],"enabling":[218],"eight":[219],"referred":[222],"PS4MAC_AP.":[225],"Finally,":[226],"output-stationary":[227],"systolic":[228],"arrays":[229],"(SAs)":[230],"explored":[232],"using":[233],"above-mentioned":[235],"designs":[237,248],"implement":[239],"operating":[241],"under":[242],"1":[244],"GHz":[245],"clock.":[246],"Our":[247],"show":[249],"highest":[251],"energy":[252,277],"outstanding":[255],"all":[259,295],"modes.":[265,297],"Compared":[266],"traditional":[269],"SA":[270],"high-precision-split":[272],"multipliers,":[273],"PS4MAC_AP":[274],"improves":[275],"0.6":[283],"TOPS/W,":[284],"PS4MAC":[286],"0.4":[288],"TOPS/W":[289,292],"-":[290],"0.7":[291],"improvement":[293]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
