{"id":"https://openalex.org/W4406461638","doi":"https://doi.org/10.1109/slt61566.2024.10832205","title":"Rand: Robustness Aware Norm Decay for Quantized Neural Networks","display_name":"Rand: Robustness Aware Norm Decay for Quantized Neural Networks","publication_year":2024,"publication_date":"2024-12-02","ids":{"openalex":"https://openalex.org/W4406461638","doi":"https://doi.org/10.1109/slt61566.2024.10832205"},"language":"en","primary_location":{"id":"doi:10.1109/slt61566.2024.10832205","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832205","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079902855","display_name":"David Qiu","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"David Qiu","raw_affiliation_strings":["Google, LLC"],"affiliations":[{"raw_affiliation_string":"Google, LLC","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053114931","display_name":"David Rim","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Rim","raw_affiliation_strings":["Google, LLC"],"affiliations":[{"raw_affiliation_string":"Google, LLC","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058886181","display_name":"Shaojin Ding","orcid":"https://orcid.org/0000-0002-2108-3111"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shaojin Ding","raw_affiliation_strings":["Google, LLC"],"affiliations":[{"raw_affiliation_string":"Google, LLC","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103149673","display_name":"Oleg Rybakov","orcid":"https://orcid.org/0009-0007-0021-047X"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oleg Rybakov","raw_affiliation_strings":["Google, LLC"],"affiliations":[{"raw_affiliation_string":"Google, LLC","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101319167","display_name":"Yanzhang He","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanzhang He","raw_affiliation_strings":["Google, LLC"],"affiliations":[{"raw_affiliation_string":"Google, LLC","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5079902855"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23836388,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1023","last_page":"1030"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6990020275115967},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5951102375984192},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5142085552215576},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36834269762039185},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.32304027676582336}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6990020275115967},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5951102375984192},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5142085552215576},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36834269762039185},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.32304027676582336},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/slt61566.2024.10832205","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832205","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W854541894","https://openalex.org/W1494198834","https://openalex.org/W1522301498","https://openalex.org/W1922655562","https://openalex.org/W1945616565","https://openalex.org/W2113158412","https://openalex.org/W2119144962","https://openalex.org/W2242818861","https://openalex.org/W2250357346","https://openalex.org/W2319920447","https://openalex.org/W2497335382","https://openalex.org/W2526425061","https://openalex.org/W2777662428","https://openalex.org/W2799473636","https://openalex.org/W2803549871","https://openalex.org/W2892009249","https://openalex.org/W2962760690","https://openalex.org/W2962824709","https://openalex.org/W2963250244","https://openalex.org/W2963532001","https://openalex.org/W2964539095","https://openalex.org/W3007227084","https://openalex.org/W3015194534","https://openalex.org/W3017022649","https://openalex.org/W3028545098","https://openalex.org/W3030437843","https://openalex.org/W3035855442","https://openalex.org/W3036102031","https://openalex.org/W3095311338","https://openalex.org/W3097522836","https://openalex.org/W3097777922","https://openalex.org/W3101648800","https://openalex.org/W3139918052","https://openalex.org/W3154998900","https://openalex.org/W3163169798","https://openalex.org/W3176259480","https://openalex.org/W3196547485","https://openalex.org/W4221138270","https://openalex.org/W4223988178","https://openalex.org/W4224918069","https://openalex.org/W4281622880","https://openalex.org/W4287756219","https://openalex.org/W4293166090","https://openalex.org/W4293846201","https://openalex.org/W4297727296","https://openalex.org/W4306809345","https://openalex.org/W4311427561","https://openalex.org/W4385245566","https://openalex.org/W6623517193","https://openalex.org/W6631190155","https://openalex.org/W6640090968","https://openalex.org/W6640425456","https://openalex.org/W6677580257","https://openalex.org/W6690026940","https://openalex.org/W6691509046","https://openalex.org/W6700264148","https://openalex.org/W6747381837","https://openalex.org/W6760069825","https://openalex.org/W6767597771","https://openalex.org/W6771467084","https://openalex.org/W6775717222","https://openalex.org/W6776767859","https://openalex.org/W6779648490","https://openalex.org/W6779775157","https://openalex.org/W6779813529","https://openalex.org/W6791904447","https://openalex.org/W6810983866","https://openalex.org/W6838118415","https://openalex.org/W6842795023","https://openalex.org/W6847034171"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"With":[0],"the":[1,5,26,42,117,129,133,141,153,165,172],"rapid":[2],"increase":[3],"in":[4,189],"size":[6],"of":[7,17,33,44,68,92,125,128,177],"neural":[8],"networks,":[9],"model":[10,110,185],"compression":[11],"has":[12],"become":[13],"an":[14,21],"important":[15],"area":[16],"research.":[18],"Quantization":[19],"is":[20,95,107],"effective":[22],"technique":[23],"for":[24],"decreasing":[25],"size,":[27],"memory":[28],"access,":[29],"and":[30,136,149,168,192],"compute":[31],"load":[32],"large":[34],"models.":[35],"In":[36],"this":[37],"paper,":[38],"we":[39,113],"first":[40],"benchmark":[41],"impact":[43],"techniques":[45],"such":[46],"as":[47,80,82,119],"straight":[48],"through":[49],"estimator,":[50],"pseudo-quantization":[51],"noise":[52],"(PQN),":[53],"learnable":[54,101,147],"scale":[55,102,118,148],"parameter,":[56],"clipping,":[57],"etc.":[58],"on":[59,196],"4-bit":[60],"seq":[61,63],"2":[62],"models":[64],"across":[65],"a":[66,120,126,161,183],"suite":[67],"speech":[69],"recognition":[70],"datasets":[71],"ranging":[72],"from":[73],"1,000":[74],"hours":[75],"to":[76,87,109,115,155,174],"1":[77],"million":[78],"hours,":[79],"well":[81,188],"one":[83],"machine":[84],"translation":[85],"dataset":[86],"illustrate":[88],"its":[89,178],"applicability":[90],"outside":[91],"speech.":[93,199],"It":[94],"commonly":[96],"believed":[97],"that":[98,138,186],"having":[99],"dedicated":[100],"parameters":[103],"per":[104],"quantization":[105,134],"group":[106,135],"critical":[108],"accuracy.":[111],"Instead,":[112],"propose":[114],"construct":[116],"L<inf":[121],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[122],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">p</inf>":[123],"norm":[124,139],"few":[127],"largest":[130],"outliers":[131],"within":[132,140],"regularizing":[137],"end-to-end":[142],"optimization.":[143],"This":[144],"outperforms":[145],"popular":[146],"clipping":[150],"methods":[151],"without":[152],"need":[154],"introduce":[156],"extra":[157],"parameters.":[158],"PQN-QAT":[159],"shows":[160],"larger":[162],"improvement":[163],"under":[164],"proposed":[166],"method,":[167],"it":[169],"opens":[170],"up":[171],"potential":[173],"exploit":[175],"some":[176],"other":[179],"benefits:":[180],"1)":[181],"training":[182],"single":[184],"performs":[187],"mixed":[190],"precision":[191],"2)":[193],"improved":[194],"generalization":[195],"long":[197],"form":[198]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
