{"id":"https://openalex.org/W3203678853","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534248","title":"CAQ: Context-Aware Quantization via Reinforcement Learning","display_name":"CAQ: Context-Aware Quantization via Reinforcement Learning","publication_year":2021,"publication_date":"2021-07-18","ids":{"openalex":"https://openalex.org/W3203678853","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534248","mag":"3203678853"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn52387.2021.9534248","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534248","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026897667","display_name":"Zhijun Tu","orcid":"https://orcid.org/0000-0001-8740-7927"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhijun Tu","raw_affiliation_strings":["College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034675932","display_name":"Jian Ma","orcid":"https://orcid.org/0000-0002-9269-1130"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Ma","raw_affiliation_strings":["College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032104477","display_name":"Tian Xia","orcid":"https://orcid.org/0000-0002-2520-3731"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tian Xia","raw_affiliation_strings":["College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103215955","display_name":"Wenzhe Zhao","orcid":"https://orcid.org/0009-0009-1517-9422"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenzhe Zhao","raw_affiliation_strings":["College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044243518","display_name":"Pengju Ren","orcid":"https://orcid.org/0000-0003-1163-2014"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengju Ren","raw_affiliation_strings":["College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047405956","display_name":"Nanning Zheng","orcid":"https://orcid.org/0000-0003-1608-8257"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nanning Zheng","raw_affiliation_strings":["College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Xi'an Jiaotong University, Xi'an, China","institution_ids":["https://openalex.org/I87445476"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5026897667"],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":0.0961,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.40142157,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7649592161178589},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.729456901550293},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6833747029304504},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5412026047706604},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.5071451663970947},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4570787250995636},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4479960799217224},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.42991945147514343},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32786184549331665},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13857492804527283}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7649592161178589},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.729456901550293},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6833747029304504},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5412026047706604},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.5071451663970947},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4570787250995636},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4479960799217224},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.42991945147514343},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32786184549331665},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13857492804527283},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn52387.2021.9534248","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534248","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6577951179","display_name":null,"funder_award_id":"2019B010153003","funder_id":"https://openalex.org/F4320336405","funder_display_name":"Special Project for Research and Development in Key areas of Guangdong Province"},{"id":"https://openalex.org/G8667147361","display_name":null,"funder_award_id":"61773307","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336405","display_name":"Special Project for Research and Development in Key areas of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W992687842","https://openalex.org/W1861492603","https://openalex.org/W2017957151","https://openalex.org/W2119144962","https://openalex.org/W2163605009","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2291160084","https://openalex.org/W2300242332","https://openalex.org/W2319920447","https://openalex.org/W2405920868","https://openalex.org/W2553303224","https://openalex.org/W2618530766","https://openalex.org/W2754084392","https://openalex.org/W2766839578","https://openalex.org/W2809624076","https://openalex.org/W2886851211","https://openalex.org/W2897049076","https://openalex.org/W2898755250","https://openalex.org/W2913318911","https://openalex.org/W2950141105","https://openalex.org/W2950726407","https://openalex.org/W2963122961","https://openalex.org/W2963150697","https://openalex.org/W2963163009","https://openalex.org/W2963864421","https://openalex.org/W2964217848","https://openalex.org/W2964259004","https://openalex.org/W2964299589","https://openalex.org/W2981751377","https://openalex.org/W2982479999","https://openalex.org/W2998218113","https://openalex.org/W3008255452","https://openalex.org/W3038470071","https://openalex.org/W4288601266","https://openalex.org/W4289401368","https://openalex.org/W6677580257","https://openalex.org/W6684921986","https://openalex.org/W6696798448","https://openalex.org/W6698200048","https://openalex.org/W6700264148","https://openalex.org/W6714058667","https://openalex.org/W6729956949","https://openalex.org/W6745499037","https://openalex.org/W6746698991","https://openalex.org/W6753069482","https://openalex.org/W6755246743","https://openalex.org/W6756887525","https://openalex.org/W6758082782"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2024136090","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W2964765435","https://openalex.org/W20361778"],"abstract_inverted_index":{"Model":[0],"quantization":[1,91],"is":[2,69],"a":[3,82,93,142,156,180,195],"crucial":[4],"step":[5],"for":[6,73,103],"porting":[7],"Deep":[8],"Neural":[9,160],"Networks":[10],"(DNNs)":[11],"on":[12,36,109,155,168,179,231],"embedded":[13],"devices":[14],"to":[15,61,101,119,124],"meet":[16],"the":[17,28,33,37,54,70,74,89,104,110,121,126,132,136,170,188,201,226],"limited":[18],"computation":[19],"and":[20,31,56,97,139,144,166,214,238],"storage":[21],"resources":[22],"requirement.":[23],"Traditional":[24],"methods":[25,49],"usually":[26],"obtain":[27],"scaling":[29,51,106,117],"factor":[30,52],"quantize":[32],"weights":[34],"based":[35,108],"information":[38],"of":[39,50,159],"single":[40,181],"layer.":[41],"However,":[42],"our":[43,153],"analysis":[44],"indicate":[45],"that":[46,225],"these":[47],"selection":[48],"overlook":[53],"differences":[55],"dependencies":[57],"among":[58],"layers,":[59],"leading":[60],"large":[62],"truncation":[63],"errors":[64],"or":[65],"zeroing":[66],"errors,":[67],"which":[68,87,198],"main":[71],"reason":[72],"performance":[75],"degradation.":[76],"To":[77],"this":[78],"end,":[79],"we":[80,114,222],"propose":[81],"Context-Aware":[83],"Quantization":[84],"(CAQ)":[85],"scheme,":[86],"formalizes":[88],"model":[90],"as":[92,235],"global":[94],"optimization":[95],"problem":[96],"leverages":[98],"reinforcement":[99],"learning":[100],"search":[102,122,127,172],"optimal":[105],"factors":[107,118],"entire":[111,171],"model.":[112],"Further,":[113],"adopt":[115],"shift-based":[116],"narrow":[120],"space":[123],"improve":[125],"efficiency,":[128],"additionally,":[129],"it":[130],"reduces":[131],"computational":[133],"complexity":[134],"during":[135],"inference":[137],"phase,":[138],"also":[140],"provides":[141],"simpler":[143],"more":[145],"robust":[146],"activation":[147],"calibration":[148],"solution.":[149],"We":[150],"extensively":[151],"test":[152],"scheme":[154,192],"wide":[157],"range":[158],"Networks,":[161],"including":[162],"ResNet":[163],"50/101/152,":[164],"InceptionV3":[165],"MobileNetV2":[167],"ImageNet,":[169],"process":[173],"only":[174],"takes":[175],"about":[176],"1":[177],"hour":[178],"GeForce":[182],"RTX":[183],"2080":[184],"Ti.":[185],"Compared":[186],"with":[187],"existed":[189],"methods,":[190],"Our":[191],"can":[193,228],"get":[194],"better":[196],"performance,":[197],"could":[199],"maintain":[200],"post-quantization":[202],"accuracy":[203],"loss":[204],"less":[205],"than":[206],"0.25%,":[207],"while":[208],"reducing":[209],"memory":[210],"footprint":[211],"by":[212,219],"5%-8%":[213],"multiply":[215],"accumulate":[216],"(MAC)":[217],"operations":[218],"2%-4%.":[220],"Besides,":[221],"further":[223],"show":[224],"CAQ":[227],"be":[229],"applied":[230],"other":[232],"tasks,":[233],"such":[234],"object":[236],"detection":[237],"segmentation.":[239]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
