{"id":"https://openalex.org/W4409248530","doi":"https://doi.org/10.1109/hpca61900.2025.00059","title":"Panacea: Novel DNN Accelerator using Accuracy-Preserving Asymmetric Quantization and Energy-Saving Bit-Slice Sparsity","display_name":"Panacea: Novel DNN Accelerator using Accuracy-Preserving Asymmetric Quantization and Energy-Saving Bit-Slice Sparsity","publication_year":2025,"publication_date":"2025-03-01","ids":{"openalex":"https://openalex.org/W4409248530","doi":"https://doi.org/10.1109/hpca61900.2025.00059"},"language":"en","primary_location":{"id":"doi:10.1109/hpca61900.2025.00059","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00059","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064486180","display_name":"Dongyun Kam","orcid":"https://orcid.org/0000-0002-8542-1845"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Dongyun Kam","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028977510","display_name":"Myeongji Yun","orcid":"https://orcid.org/0009-0002-0538-6427"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Myeongji Yun","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061982705","display_name":"Sunwoo Yoo","orcid":null},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sunwoo Yoo","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101742717","display_name":"Seungwoo Hong","orcid":"https://orcid.org/0000-0003-2736-3955"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seungwoo Hong","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038110244","display_name":"Zhengya Zhang","orcid":"https://orcid.org/0000-0001-5963-9018"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhengya Zhang","raw_affiliation_strings":["University of Michigan"],"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048891431","display_name":"Youngjoo Lee","orcid":"https://orcid.org/0000-0002-2467-8276"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Youngjoo Lee","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5064486180"],"corresponding_institution_ids":["https://openalex.org/I123900574"],"apc_list":null,"apc_paid":null,"fwci":2.3641,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.88118903,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"701","last_page":"715"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9488000273704529,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9488000273704529,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.944100022315979,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13182","display_name":"Quantum-Dot Cellular Automata","score":0.9290000200271606,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.7677699327468872},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7202164530754089},{"id":"https://openalex.org/keywords/panacea","display_name":"Panacea (medicine)","score":0.6229488849639893},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.542586624622345},{"id":"https://openalex.org/keywords/bit","display_name":"Bit (key)","score":0.4235967993736267},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.40125560760498047},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.32620328664779663},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16236186027526855},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.08541938662528992},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.07465636730194092}],"concepts":[{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.7677699327468872},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7202164530754089},{"id":"https://openalex.org/C26993612","wikidata":"https://www.wikidata.org/wiki/Q910154","display_name":"Panacea (medicine)","level":3,"score":0.6229488849639893},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.542586624622345},{"id":"https://openalex.org/C117011727","wikidata":"https://www.wikidata.org/wiki/Q1278488","display_name":"Bit (key)","level":2,"score":0.4235967993736267},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40125560760498047},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.32620328664779663},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16236186027526855},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.08541938662528992},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.07465636730194092},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.0},{"id":"https://openalex.org/C204787440","wikidata":"https://www.wikidata.org/wiki/Q188504","display_name":"Alternative medicine","level":2,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca61900.2025.00059","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00059","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8100000023841858,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322064","display_name":"Korea Institute for Advancement of Technology","ror":"https://ror.org/015w1qa96"},{"id":"https://openalex.org/F4320322202","display_name":"IC Design Education Center","ror":"https://ror.org/005v57z85"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W1677182931","https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2604319603","https://openalex.org/W2725159389","https://openalex.org/W2769502706","https://openalex.org/W2883920103","https://openalex.org/W2923014074","https://openalex.org/W2944869944","https://openalex.org/W2950865323","https://openalex.org/W2963122961","https://openalex.org/W2963367920","https://openalex.org/W2980186997","https://openalex.org/W2990295915","https://openalex.org/W3034940165","https://openalex.org/W3043504674","https://openalex.org/W3095319910","https://openalex.org/W3098068080","https://openalex.org/W3100985894","https://openalex.org/W3106171539","https://openalex.org/W3116917247","https://openalex.org/W3137147200","https://openalex.org/W3172129612","https://openalex.org/W3202442802","https://openalex.org/W4206016550","https://openalex.org/W4240168186","https://openalex.org/W4255949318","https://openalex.org/W4291653336","https://openalex.org/W4308083739","https://openalex.org/W4313069943","https://openalex.org/W4319996342","https://openalex.org/W4360831844","https://openalex.org/W4366341968","https://openalex.org/W4385300578","https://openalex.org/W4386075763","https://openalex.org/W4386076113","https://openalex.org/W4390873673","https://openalex.org/W4393406875","https://openalex.org/W4393407021","https://openalex.org/W4393407042","https://openalex.org/W6631943919","https://openalex.org/W6688979741","https://openalex.org/W6720242923","https://openalex.org/W6727099177","https://openalex.org/W6754503602","https://openalex.org/W6755207826","https://openalex.org/W6772383348","https://openalex.org/W6780343938","https://openalex.org/W6788001715","https://openalex.org/W6788135285","https://openalex.org/W6789240164","https://openalex.org/W6790521546","https://openalex.org/W6795991173","https://openalex.org/W6796815506","https://openalex.org/W6797854001","https://openalex.org/W6811340617","https://openalex.org/W6840088539","https://openalex.org/W6842758154","https://openalex.org/W6847478871","https://openalex.org/W6848451824","https://openalex.org/W6850162387","https://openalex.org/W6851828392","https://openalex.org/W6852337893","https://openalex.org/W6853436738","https://openalex.org/W6854866820","https://openalex.org/W6856449218","https://openalex.org/W6856696905","https://openalex.org/W6856969750","https://openalex.org/W6861133234","https://openalex.org/W6877022392"],"related_works":["https://openalex.org/W2791057018","https://openalex.org/W2100901739","https://openalex.org/W2073210364","https://openalex.org/W4242593755","https://openalex.org/W2123548032","https://openalex.org/W3204400881","https://openalex.org/W3214410901","https://openalex.org/W3204296682","https://openalex.org/W3183118997","https://openalex.org/W2917767146"],"abstract_inverted_index":{"Low":[0],"bit-precisions":[1],"and":[2,36,87,109,152,173,182,207,214,221,244,250,253,264],"their":[3,154],"bit-slice":[4,31,91,133,261],"sparsity":[5,32,160],"have":[6,63],"recently":[7],"been":[8],"studied":[9],"to":[10,56,99,130,203,217],"accelerate":[11],"general":[12],"matrix-multiplications":[13],"(GEMM)":[14],"during":[15],"large-scale":[16,113],"deep":[17],"neural":[18],"network":[19],"(DNN)":[20],"inferences.":[21],"While":[22],"the":[23,43,75,101,125,131,142,158,179,185,200,259,265],"conventional":[24],"symmetric":[25],"quantization":[26,67,78],"facilitates":[27],"low-resolution":[28],"processing":[29,97],"with":[30,276],"for":[33,51,68,112,124],"both":[34],"weight":[35],"activation,":[37],"its":[38,228],"accuracy":[39,59,108],"loss":[40],"caused":[41],"by":[42,89,149],"activation\u2019s":[44],"asymmetric":[45,66,77,150,277],"distributions":[46],"cannot":[47,84],"be":[48,85],"acceptable,":[49],"especially":[50],"largescale":[52],"DNNs.":[53],"In":[54,128],"efforts":[55],"mitigate":[57],"this":[58,116],"loss,":[60],"recent":[61,90,260],"studies":[62],"actively":[64],"utilized":[65],"activations":[69],"without":[70],"requiring":[71],"additional":[72],"operations.":[73,155],"However,":[74],"cuttingedge":[76],"produces":[79],"numerous":[80],"nonzero":[81,146],"slices":[82],"that":[83,235],"compressed":[86],"skipped":[88],"GEMM":[92,122],"accelerators,":[93,240],"naturally":[94],"consuming":[95],"more":[96],"energy":[98,248],"handle":[100],"quantized":[102],"DNN":[103,114,191,239],"models.To":[104],"simultaneously":[105],"achieve":[106],"high":[107],"hardware":[110,229],"efficiency":[111],"inferences,":[115],"paper":[117],"proposes":[118],"an":[119],"Asymmetrically-Quantized":[120],"bit-Slice":[121],"(AQS-GEMM)":[123],"first":[126],"time.":[127],"contrast":[129],"previous":[132],"computing,":[134],"which":[135,194],"only":[136],"skips":[137,153],"operations":[138],"of":[139,161,199],"zero":[140],"slices,":[141,147],"AQS-GEMM":[143,181,202],"compresses":[144],"frequent":[145],"generated":[148],"quantization,":[151],"To":[156,177],"increase":[157,204],"slicelevel":[159],"activations,":[162],"we":[163,187],"also":[164],"introduce":[165,189],"two":[166],"algorithm-hardware":[167],"co-optimization":[168],"methods:":[169],"a":[170,174,190,211],"zero-point":[171],"manipulation":[172],"distribution-based":[175],"bit-slicing.":[176],"support":[178],"proposed":[180],"optimizations":[183],"at":[184],"hardware-level,":[186],"newly":[188],"accelerator,":[192],"Panacea,":[193],"efficiently":[195],"handles":[196],"sparse/dense":[197],"workloads":[198],"tiled":[201],"data":[205,219],"reuse":[206,220],"utilization.":[208],"Panacea":[209,236],"supports":[210],"specialized":[212],"dataflow":[213],"run-length":[215],"encoding":[216],"maximize":[218],"minimize":[222],"external":[223],"memory":[224],"accesses,":[225],"significantly":[226],"improving":[227],"efficiency.":[230],"Numerous":[231],"benchmark":[232],"evaluations":[233],"show":[234],"outperforms":[237],"existing":[238],"e.g.,":[241],"$1.97":[242],"\\times$":[243,246,252,255],"$3.26":[245],"higher":[247,256],"efficiency,":[249],"$1.88":[251],"$2.41":[254],"throughput":[257],"than":[258],"accelerator":[262],"Sibia":[263],"SIMD":[266],"design,":[267],"respectively,":[268],"on":[269],"OPT-2.7B,":[270],"while":[271],"providing":[272],"better":[273],"algorithm":[274],"performance":[275],"quantization.":[278]},"counts_by_year":[{"year":2026,"cited_by_count":3}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
