{"id":"https://openalex.org/W7133619966","doi":"https://doi.org/10.48550/arxiv.2603.04359","title":"Dissecting Quantization Error: A Concentration-Alignment Perspective","display_name":"Dissecting Quantization Error: A Concentration-Alignment Perspective","publication_year":2026,"publication_date":"2026-03-04","ids":{"openalex":"https://openalex.org/W7133619966","doi":"https://doi.org/10.48550/arxiv.2603.04359"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.04359","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128192633","display_name":"Marco Federici","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Federici, Marco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018684838","display_name":"Boris van Breugel","orcid":"https://orcid.org/0009-0006-5125-0028"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"van Breugel, Boris","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103266146","display_name":"Paul N. Whatmough","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Whatmough, Paul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5111645310","display_name":"Markus Nagel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nagel, Markus","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.49230000376701355,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.49230000376701355,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.0877000018954277,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.06750000268220901,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.85589998960495},{"id":"https://openalex.org/keywords/hadamard-transform","display_name":"Hadamard transform","score":0.685699999332428},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.5756999850273132},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.46230000257492065},{"id":"https://openalex.org/keywords/linde\u2013buzo\u2013gray-algorithm","display_name":"Linde\u2013Buzo\u2013Gray algorithm","score":0.40689998865127563},{"id":"https://openalex.org/keywords/covariance","display_name":"Covariance","score":0.38420000672340393}],"concepts":[{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.85589998960495},{"id":"https://openalex.org/C60292330","wikidata":"https://www.wikidata.org/wiki/Q1014065","display_name":"Hadamard transform","level":2,"score":0.685699999332428},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.5756999850273132},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5615000128746033},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4666999876499176},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.46230000257492065},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45899999141693115},{"id":"https://openalex.org/C93372532","wikidata":"https://www.wikidata.org/wiki/Q6552455","display_name":"Linde\u2013Buzo\u2013Gray algorithm","level":3,"score":0.40689998865127563},{"id":"https://openalex.org/C178650346","wikidata":"https://www.wikidata.org/wiki/Q201984","display_name":"Covariance","level":2,"score":0.38420000672340393},{"id":"https://openalex.org/C5317259","wikidata":"https://www.wikidata.org/wiki/Q4462361","display_name":"Trellis quantization","level":5,"score":0.383899986743927},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3165999948978424},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31060001254081726},{"id":"https://openalex.org/C97137487","wikidata":"https://www.wikidata.org/wiki/Q729138","display_name":"Integer (computer science)","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.26489999890327454},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.259799987077713}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.04359","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.04359","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.04359","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.04359","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Quantization":[0],"can":[1,110],"drastically":[2],"increase":[3],"the":[4,47,66,78,93,166],"efficiency":[5],"of":[6,68,80,95],"large":[7],"language":[8],"and":[9,70,74,76,108,142],"vision":[10],"models,":[11],"but":[12],"typically":[13],"incurs":[14],"an":[15,87],"accuracy":[16],"drop.":[17],"Recently,":[18],"function-preserving":[19],"transforms":[20,98],"(e.g.":[21,99],"rotations,":[22],"Hadamard":[23],"transform,":[24],"channel-wise":[25],"scaling)":[26],"have":[27],"been":[28],"successfully":[29],"applied":[30],"to":[31,138],"reduce":[32,112],"post-training":[33],"quantization":[34,45,56,113,160],"error,":[35],"yet":[36],"a":[37,58,124,130,134],"principled":[38],"explanation":[39],"remains":[40],"elusive.":[41],"We":[42],"analyze":[43],"linear-layer":[44],"via":[46],"signal-to-quantization-noise":[48],"ratio":[49],"(SQNR),":[50],"showing":[51],"that":[52,128,152],"for":[53],"uniform":[54],"integer":[55],"at":[57,162],"fixed":[59],"bit":[60],"width,":[61],"SQNR":[62],"decomposes":[63],"into":[64],"(i)":[65],"concentration":[67,91,141],"weights":[69],"activations":[71],"(capturing":[72],"spread":[73],"outliers),":[75],"(ii)":[77],"alignment":[79,105],"their":[81],"dominant":[82],"variation":[83],"directions.":[84],"This":[85],"reveals":[86],"actionable":[88],"insight:":[89],"beyond":[90],"-":[92,103],"focus":[94],"most":[96],"prior":[97,158],"rotations":[100],"or":[101,156],"Hadamard)":[102],"improving":[104],"between":[106],"weight":[107],"activation":[109],"further":[111],"error.":[114],"Motivated":[115],"by":[116],"this,":[117],"we":[118],"introduce":[119],"block":[120],"Concentration-Alignment":[121],"Transforms":[122],"(CAT),":[123],"lightweight":[125],"linear":[126],"transformation":[127],"uses":[129],"covariance":[131],"estimate":[132],"from":[133],"small":[135],"calibration":[136],"set":[137],"jointly":[139],"improve":[140],"alignment,":[143],"approximately":[144],"maximizing":[145],"SQNR.":[146],"Experiments":[147],"across":[148],"several":[149],"LLMs":[150],"show":[151],"CAT":[153],"consistently":[154],"matches":[155],"outperforms":[157],"transform-based":[159],"methods":[161],"4-bit":[163],"precision,":[164],"confirming":[165],"insights":[167],"gained":[168],"in":[169],"our":[170],"framework.":[171]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-06T00:00:00"}
