{"id":"https://openalex.org/W4404133677","doi":"https://doi.org/10.1145/3649329.3655986","title":"Drift: Leveraging Distribution-based Dynamic Precision Quantization for Efficient Deep Neural Network Acceleration","display_name":"Drift: Leveraging Distribution-based Dynamic Precision Quantization for Efficient Deep Neural Network Acceleration","publication_year":2024,"publication_date":"2024-06-23","ids":{"openalex":"https://openalex.org/W4404133677","doi":"https://doi.org/10.1145/3649329.3655986"},"language":"en","primary_location":{"id":"doi:10.1145/3649329.3655986","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3649329.3655986","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 61st ACM/IEEE Design Automation Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103253476","display_name":"Lian Liu","orcid":"https://orcid.org/0000-0003-2226-2303"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lian Liu","raw_affiliation_strings":["CICS, Institute of Computing Technology, CAS, Beijing, Beijing, China","University of Chinese Academy of Sciences, Beijing, China","Zhongguancun National Laboratory, Beijing, China"],"affiliations":[{"raw_affiliation_string":"CICS, Institute of Computing Technology, CAS, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210090176"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Zhongguancun National Laboratory, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100532497","display_name":"Xu Zhaohui","orcid":"https://orcid.org/0009-0003-8334-6903"},"institutions":[{"id":"https://openalex.org/I30809798","display_name":"ShanghaiTech University","ror":"https://ror.org/030bhh786","country_code":"CN","type":"education","lineage":["https://openalex.org/I30809798"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaohui Xu","raw_affiliation_strings":["School of Information Science and Technology, ShanghaiTech University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, ShanghaiTech University, Shanghai, China","institution_ids":["https://openalex.org/I30809798"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090389605","display_name":"Yintao He","orcid":"https://orcid.org/0000-0003-3054-0617"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yintao He","raw_affiliation_strings":["SKLP, Institute of Computing Technology, Chinese Academy of Sciences, Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SKLP, Institute of Computing Technology, Chinese Academy of Sciences, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100346965","display_name":"Ying Wang","orcid":"https://orcid.org/0000-0001-5172-4736"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Wang","raw_affiliation_strings":["CICS, Institute of Computing Technology, CAS, Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"CICS, Institute of Computing Technology, CAS, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210090176"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100768288","display_name":"Huawei Li","orcid":"https://orcid.org/0000-0001-8082-4218"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huawei Li","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023380073","display_name":"Xiaowei Li","orcid":"https://orcid.org/0000-0002-0874-814X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaowei Li","raw_affiliation_strings":["ICT, Chinese Academy of Sciences, Beijing, NA, China"],"affiliations":[{"raw_affiliation_string":"ICT, Chinese Academy of Sciences, Beijing, NA, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016864694","display_name":"Yinhe Han","orcid":"https://orcid.org/0000-0003-0904-6681"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yinhe Han","raw_affiliation_strings":["Institute of Computing Technology,Chinese Academy of Sciences, Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology,Chinese Academy of Sciences, Beijing, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5103253476"],"corresponding_institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":1.3901,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.84971065,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9778000116348267,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.761803388595581},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.7587769031524658},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6794026494026184},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5868072509765625},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47984835505485535},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.46423712372779846},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.25574952363967896},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10375893115997314}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.761803388595581},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.7587769031524658},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6794026494026184},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5868072509765625},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47984835505485535},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.46423712372779846},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.25574952363967896},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10375893115997314},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3649329.3655986","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3649329.3655986","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 61st ACM/IEEE Design Automation Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W2963367920","https://openalex.org/W3043504674","https://openalex.org/W3097528158","https://openalex.org/W3098576111","https://openalex.org/W3213241618","https://openalex.org/W4214634256","https://openalex.org/W4280582299","https://openalex.org/W4389163074"],"related_works":["https://openalex.org/W2565094479","https://openalex.org/W2390829436","https://openalex.org/W1989791859","https://openalex.org/W602859758","https://openalex.org/W1971289376","https://openalex.org/W2379101322","https://openalex.org/W1992553864","https://openalex.org/W2776207444","https://openalex.org/W2726447019","https://openalex.org/W2006439817"],"abstract_inverted_index":{"Quantization":[0],"is":[1],"one":[2],"of":[3,23,34,49],"the":[4,20,32,45,54,89],"most":[5],"hardware-efficient":[6],"ways":[7],"to":[8,43,70,108,139],"reduce":[9,72],"inference":[10],"costs":[11,74],"for":[12],"deep":[13],"neural":[14],"network":[15],"(DNN)":[16],"models.":[17,79,125,146],"Nevertheless,":[18],"with":[19,92,117,143],"continuous":[21],"increase":[22],"DNN":[24,61,78,90,119],"model":[25],"sizes":[26],"(240\u00d7":[27],"in":[28,57],"two":[29],"years)":[30],"and":[31,47,104,123,134],"emergence":[33],"large":[35],"language":[36],"models,":[37,62,120],"existing":[38,84,140],"static":[39],"quantization":[40,68],"methods":[41],"fail":[42],"utilize":[44],"sparsity":[46],"redundancy":[48],"models":[50,91],"sufficiently.":[51],"Motivated":[52],"by":[53],"pervasive":[55],"dynamism":[56],"data":[58],"tensors":[59],"across":[60],"we":[63,81,98],"propose":[64],"a":[65,100],"dynamic":[66,93,111],"precision":[67,112],"algorithm":[69],"further":[71],"computational":[73],"beyond":[75],"statically":[76,144],"quantized":[77,145],"Furthermore,":[80],"find":[82],"that":[83,129],"precision-flexible":[85,141],"accelerators":[86,142],"cannot":[87],"support":[88,110],"precision.":[94],"To":[95],"this":[96],"end,":[97],"design":[99],"novel":[101],"accelerator,":[102],"Drift,":[103],"achieve":[105],"online":[106],"scheduling":[107],"efficiently":[109],"execution.":[113],"We":[114],"conduct":[115],"experiments":[116],"various":[118],"including":[121],"CNN-based":[122],"Transformer-based":[124],"Evaluation":[126],"results":[127],"show":[128],"Drift":[130],"achieves":[131],"2.85\u00d7":[132],"speedup":[133],"3.12\u00d7":[135],"energy":[136],"saving":[137],"compared":[138]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
