{"id":"https://openalex.org/W4382203393","doi":"https://doi.org/10.1109/tpds.2023.3290010","title":"APQ: Automated DNN Pruning and Quantization for ReRAM-Based Accelerators","display_name":"APQ: Automated DNN Pruning and Quantization for ReRAM-Based Accelerators","publication_year":2023,"publication_date":"2023-06-27","ids":{"openalex":"https://openalex.org/W4382203393","doi":"https://doi.org/10.1109/tpds.2023.3290010"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2023.3290010","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2023.3290010","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043851369","display_name":"Siling Yang","orcid":"https://orcid.org/0000-0002-2208-559X"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Siling Yang","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-2208-559X","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004997843","display_name":"Shuibing He","orcid":"https://orcid.org/0000-0002-7075-4153"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuibing He","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-7075-4153","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101556035","display_name":"Hexiao Duan","orcid":"https://orcid.org/0009-0000-5130-7502"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hexiao Duan","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0000-5130-7502","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100681962","display_name":"Weijian Chen","orcid":"https://orcid.org/0000-0001-8296-2673"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weijian Chen","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-8296-2673","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084907146","display_name":"Xuechen Zhang","orcid":"https://orcid.org/0000-0002-3730-8901"},"institutions":[{"id":"https://openalex.org/I137317281","display_name":"Washington State University Vancouver","ror":"https://ror.org/00g2fk805","country_code":"US","type":"education","lineage":["https://openalex.org/I137317281","https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuechen Zhang","raw_affiliation_strings":["School of Engineering and Computer Science, Washington State University Vancouver, Vancouver, WA, USA"],"raw_orcid":"https://orcid.org/0000-0002-3730-8901","affiliations":[{"raw_affiliation_string":"School of Engineering and Computer Science, Washington State University Vancouver, Vancouver, WA, USA","institution_ids":["https://openalex.org/I137317281"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102002765","display_name":"Tong Wu","orcid":"https://orcid.org/0009-0003-0654-8245"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Wu","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0003-0654-8245","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101508047","display_name":"Yanlong Yin","orcid":"https://orcid.org/0009-0004-1505-4295"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanlong Yin","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0004-1505-4295","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5043851369"],"corresponding_institution_ids":["https://openalex.org/I168879160","https://openalex.org/I4210123185"],"apc_list":null,"apc_paid":null,"fwci":0.942,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.76856516,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"34","issue":"9","first_page":"2498","last_page":"2511"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7621864080429077},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.7176927328109741},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6575008630752563},{"id":"https://openalex.org/keywords/resistive-random-access-memory","display_name":"Resistive random-access memory","score":0.6403070688247681},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4731246829032898},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.45101502537727356},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.4304087162017822},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4101514220237732},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.34406328201293945},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3325055241584778},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.103883296251297}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7621864080429077},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.7176927328109741},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6575008630752563},{"id":"https://openalex.org/C182019814","wikidata":"https://www.wikidata.org/wiki/Q1143830","display_name":"Resistive random-access memory","level":3,"score":0.6403070688247681},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4731246829032898},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.45101502537727356},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.4304087162017822},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4101514220237732},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.34406328201293945},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3325055241584778},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.103883296251297},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C147789679","wikidata":"https://www.wikidata.org/wiki/Q11372","display_name":"Physical chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C17525397","wikidata":"https://www.wikidata.org/wiki/Q176140","display_name":"Electrode","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2023.3290010","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2023.3290010","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.47999998927116394,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G4779957870","display_name":null,"funder_award_id":"62172361","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W2048266589","https://openalex.org/W2112796928","https://openalex.org/W2119144962","https://openalex.org/W2285660444","https://openalex.org/W2469490737","https://openalex.org/W2508602506","https://openalex.org/W2518281301","https://openalex.org/W2613989746","https://openalex.org/W2618530766","https://openalex.org/W2799229073","https://openalex.org/W2802367674","https://openalex.org/W2803549871","https://openalex.org/W2883149906","https://openalex.org/W2884150179","https://openalex.org/W2886851211","https://openalex.org/W2910506572","https://openalex.org/W2946659370","https://openalex.org/W2949674408","https://openalex.org/W2952899695","https://openalex.org/W2963273111","https://openalex.org/W2963723401","https://openalex.org/W2963864421","https://openalex.org/W2982479999","https://openalex.org/W3037288590","https://openalex.org/W3091895175","https://openalex.org/W3091922395","https://openalex.org/W3092032880","https://openalex.org/W3092513807","https://openalex.org/W3093326380","https://openalex.org/W3118608800","https://openalex.org/W3127794782","https://openalex.org/W3167436278","https://openalex.org/W4249545506","https://openalex.org/W4251775051","https://openalex.org/W4280615760","https://openalex.org/W4289761856","https://openalex.org/W4302570325","https://openalex.org/W4392271976","https://openalex.org/W6637373629","https://openalex.org/W6677580257","https://openalex.org/W6683826617","https://openalex.org/W6684205842","https://openalex.org/W6684921986","https://openalex.org/W6720242923","https://openalex.org/W6745722055","https://openalex.org/W6753146606","https://openalex.org/W6755509158","https://openalex.org/W6779885597","https://openalex.org/W6784315360","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W2054635671","https://openalex.org/W2931688134","https://openalex.org/W2545245183","https://openalex.org/W2377919138","https://openalex.org/W2378857091","https://openalex.org/W2350916061","https://openalex.org/W4256502920","https://openalex.org/W103652678","https://openalex.org/W2999756192","https://openalex.org/W4226090359"],"abstract_inverted_index":{"Emerging":[0],"ReRAM-based":[1,36,43,123,155,184],"accelerators":[2,44,185],"support":[3],"in-memory":[4],"computation":[5],"to":[6,21,58,63,75,133,153,186,192,196,208,231,250],"accelerate":[7],"deep":[8],"neural":[9],"network":[10],"(DNN)":[11],"inference.":[12],"Weight":[13],"matrix":[14],"pruning":[15,40,65,93,102,137],"is":[16],"a":[17,143,154,158,179],"widely":[18],"used":[19],"technique":[20,94],"reduce":[22,198],"the":[23,30,60,91,97,136,165,169,174,211,218,251],"size":[24],"of":[25,35,100,161,214,217],"DNN":[26,112,140,220],"models,":[27],"thereby":[28],"reducing":[29],"resource":[31,199],"and":[32,103,114,149,189,238],"energy":[33,240],"consumption":[34],"accelerators.":[37,124],"However,":[38],"existing":[39],"works":[41],"for":[42,122,139,142],"have":[45],"three":[46],"major":[47],"issues.":[48],"First,":[49,125],"they":[50,68,88],"use":[51,69],"heuristics":[52],"or":[53,71,244],"rules":[54],"from":[55],"domain":[56],"experts":[57],"prune":[59,76],"weights,":[61,77],"leading":[62],"sub-optimal":[64],"policies.":[66],"Second,":[67,146],"row":[70],"column-level":[72],"coarse-granularity":[73],"methods":[74],"resulting":[78],"in":[79,157,183],"poor":[80],"compression":[81,98,166,233],"rates":[82,167],"with":[83,168,242],"model":[84,247],"accuracy":[85,170],"constraints.":[86,171],"Third,":[87,195],"only":[89],"apply":[90],"weight":[92,151],"individually,":[95],"losing":[96],"opportunity":[99],"both":[101],"quantization.":[104],"In":[105],"this":[106],"article,":[107],"we":[108],"propose":[109],"an":[110],"Automated":[111],"Pruning":[113],"Quantization":[115],"framework,":[116],"named":[117],"<sc":[118,126,201,226],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[119,127,202,227],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">APQ</small>":[120,128,203,228],",":[121],"adopts":[129],"reinforcement":[130,206],"learning":[131,207],"(RL)":[132],"automatically":[134,209],"determine":[135,210],"policy":[138],"layers":[141],"global":[144],"optimum.":[145],"it":[147,177],"prunes":[148],"maps":[150],"matrices":[152],"accelerator":[156],"finer":[159],"granularity":[160],"column-vector,":[162],"which":[163],"improves":[164],"To":[172],"address":[173],"dislocation":[175],"problem,":[176],"uses":[178],"new":[180],"data":[181],"path":[182],"correctly":[187],"index":[188],"feed":[190],"input":[191],"matrix-vector":[193],"computation.":[194],"further":[197],"consumption,":[200],"also":[204],"leverages":[205],"quantization":[212],"bitwidth":[213],"each":[215],"layer":[216],"pruned":[219],"model.":[221],"Experimental":[222],"results":[223],"show":[224],"that,":[225],"achieves":[229],"up":[230],"4.52X":[232],"rate,":[234],"4.11X":[235],"area":[236],"efficiency,":[237],"4.51X":[239],"efficiency":[241],"similar":[243],"even":[245],"higher":[246],"accuracy,":[248],"compared":[249],"state-of-the-art":[252],"work.":[253]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
