{"id":"https://openalex.org/W3087810721","doi":"https://doi.org/10.1109/sips50750.2020.9195219","title":"Knowledge Distillation for Optimization of Quantized Deep Neural Networks","display_name":"Knowledge Distillation for Optimization of Quantized Deep Neural Networks","publication_year":2020,"publication_date":"2020-09-23","ids":{"openalex":"https://openalex.org/W3087810721","doi":"https://doi.org/10.1109/sips50750.2020.9195219","mag":"3087810721"},"language":"en","primary_location":{"id":"doi:10.1109/sips50750.2020.9195219","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sips50750.2020.9195219","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Workshop on Signal Processing Systems (SiPS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100705459","display_name":"Sungho Shin","orcid":"https://orcid.org/0000-0002-6155-7449"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Sungho Shin","raw_affiliation_strings":["Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011500561","display_name":"Yoonho Boo","orcid":"https://orcid.org/0000-0002-6656-4445"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yoonho Boo","raw_affiliation_strings":["Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113491293","display_name":"Wonyong Sung","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Wonyong Sung","raw_affiliation_strings":["Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100705459"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":1.0747,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.79891779,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/softmax-function","display_name":"Softmax function","score":0.9409626722335815},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.8434333801269531},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.8209196329116821},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6834809184074402},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6662099361419678},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5024478435516357},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4817119240760803},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.45202210545539856},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1931953728199005},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.11733812093734741},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.0890008807182312}],"concepts":[{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.9409626722335815},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.8434333801269531},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.8209196329116821},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6834809184074402},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6662099361419678},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5024478435516357},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4817119240760803},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.45202210545539856},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1931953728199005},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.11733812093734741},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0890008807182312},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/sips50750.2020.9195219","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sips50750.2020.9195219","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Workshop on Signal Processing Systems (SiPS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8199999928474426,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W1602122992","https://openalex.org/W1690739335","https://openalex.org/W1821462560","https://openalex.org/W2013305145","https://openalex.org/W2193413348","https://openalex.org/W2194775991","https://openalex.org/W2264905057","https://openalex.org/W2294370754","https://openalex.org/W2300242332","https://openalex.org/W2401231614","https://openalex.org/W2469490737","https://openalex.org/W2524428287","https://openalex.org/W2593221942","https://openalex.org/W2603699043","https://openalex.org/W2604342492","https://openalex.org/W2653504903","https://openalex.org/W2680270903","https://openalex.org/W2739879705","https://openalex.org/W2742947407","https://openalex.org/W2786951478","https://openalex.org/W2884001105","https://openalex.org/W2911803042","https://openalex.org/W2921712231","https://openalex.org/W2938965404","https://openalex.org/W2963140444","https://openalex.org/W2963249562","https://openalex.org/W2963318827","https://openalex.org/W2963521187","https://openalex.org/W2963723401","https://openalex.org/W2964118293","https://openalex.org/W2964137095","https://openalex.org/W2964203871","https://openalex.org/W2996834012","https://openalex.org/W6637551013","https://openalex.org/W6638523607","https://openalex.org/W6687566353","https://openalex.org/W6693066613","https://openalex.org/W6698200048","https://openalex.org/W6720242923","https://openalex.org/W6727208969","https://openalex.org/W6736274139","https://openalex.org/W6736587433","https://openalex.org/W6745722055","https://openalex.org/W6748131973","https://openalex.org/W6748163181","https://openalex.org/W6758589240"],"related_works":["https://openalex.org/W3107204728","https://openalex.org/W4287591324","https://openalex.org/W3108503355","https://openalex.org/W3090555870","https://openalex.org/W4226420367","https://openalex.org/W2962876041","https://openalex.org/W3022820045","https://openalex.org/W2801655600","https://openalex.org/W3005627584","https://openalex.org/W3170224572"],"abstract_inverted_index":{"Knowledge":[0],"distillation":[1,116],"(KD)":[2],"technique":[3,132],"that":[4,58,106],"utilizes":[5],"a":[6,12,108,119],"pretrained":[7],"teacher":[8,32,53,65,83,110,121],"model":[9,111],"for":[10,17,41,73,99,145],"training":[11,144],"student":[13],"network":[14,33,66,84],"is":[15,67],"exploited":[16],"the":[18,28,31,37,52,59,64,78,82,93,114,126,135],"optimization":[19],"of":[20,30,39,81,95,138],"quantized":[21,49,100],"deep":[22],"neural":[23],"networks":[24],"(QDNNs).":[25],"We":[26,43,123],"consider":[27],"choice":[29],"and":[34,48,140],"also":[35,124],"investigate":[36],"effect":[38],"hyperparameters":[40],"KD.":[42],"employ":[44],"several":[45],"large":[46,120],"floating-point":[47],"models":[50],"as":[51,118],"network.":[54],"The":[55],"experiment":[56],"shows":[57],"softmax":[60,79],"distribution":[61,80],"produced":[62],"by":[63,88],"more":[68],"important":[69],"than":[70],"its":[71],"performance":[72,117],"effective":[74],"KD":[75,97,147],"training.":[76,102],"Since":[77],"can":[85,112],"be":[86],"controlled":[87],"KD's":[89],"hyperparameters,":[90],"we":[91],"analyze":[92],"interrelationship":[94],"each":[96],"component":[98],"DNN":[101],"Our":[103],"experiments":[104],"show":[105],"even":[107],"small":[109],"achieve":[113],"same":[115],"model.":[122],"propose":[125],"gradual":[127],"soft":[128,141],"loss":[129],"reduction":[130],"(GSLR)":[131],"which":[133],"controls":[134],"mixing":[136],"ratio":[137],"hard":[139],"losses":[142],"during":[143],"robust":[146],"based":[148],"QDNN":[149],"optimization.":[150]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
