{"id":"https://openalex.org/W7155043582","doi":"https://doi.org/10.48550/arxiv.2604.18117","title":"LoRaQ: Optimized Low Rank Approximation for 4-bit Quantization","display_name":"LoRaQ: Optimized Low Rank Approximation for 4-bit Quantization","publication_year":2026,"publication_date":"2026-04-20","ids":{"openalex":"https://openalex.org/W7155043582","doi":"https://doi.org/10.48550/arxiv.2604.18117"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18117","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18117","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18117","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134137754","display_name":"Yann Bouquet","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bouquet, Yann","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082105097","display_name":"Alireza Khodamoradi","orcid":"https://orcid.org/0000-0001-8811-2258"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khodamoradi, Alireza","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134190554","display_name":"Sophie Y\u00e1ng Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Sophie Y\u00e1ng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035560671","display_name":"Kristof Denolf","orcid":"https://orcid.org/0000-0001-6668-4562"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Denolf, Kristof","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049300388","display_name":"Mathieu Salzmann","orcid":"https://orcid.org/0000-0002-8347-8637"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Salzmann, Mathieu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.1745000034570694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.1745000034570694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.14920000731945038,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.07090000063180923,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.8256999850273132},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3790999948978424},{"id":"https://openalex.org/keywords/approximation-algorithm","display_name":"Approximation algorithm","score":0.36250001192092896},{"id":"https://openalex.org/keywords/shaping","display_name":"Shaping","score":0.3303999900817871},{"id":"https://openalex.org/keywords/approximation-theory","display_name":"Approximation theory","score":0.3257000148296356},{"id":"https://openalex.org/keywords/linear-approximation","display_name":"Linear approximation","score":0.32109999656677246}],"concepts":[{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.8256999850273132},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5613999962806702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4659999907016754},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4643000066280365},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3790999948978424},{"id":"https://openalex.org/C148764684","wikidata":"https://www.wikidata.org/wiki/Q621751","display_name":"Approximation algorithm","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C142311740","wikidata":"https://www.wikidata.org/wiki/Q1066177","display_name":"Shaping","level":2,"score":0.3303999900817871},{"id":"https://openalex.org/C145242015","wikidata":"https://www.wikidata.org/wiki/Q774123","display_name":"Approximation theory","level":2,"score":0.3257000148296356},{"id":"https://openalex.org/C160824197","wikidata":"https://www.wikidata.org/wiki/Q2071054","display_name":"Linear approximation","level":3,"score":0.32109999656677246},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.30399999022483826},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.2816999852657318},{"id":"https://openalex.org/C122383733","wikidata":"https://www.wikidata.org/wiki/Q865920","display_name":"Approximation error","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.2540999948978424},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.2535000145435333},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.2526000142097473}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18117","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18117","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18117","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18117","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.40086257457733154,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Post-training":[0],"quantization":[1,16,74],"(PTQ)":[2],"is":[3],"essential":[4],"for":[5,56,81,134],"deploying":[6],"large":[7],"diffusion":[8],"transformers":[9],"on":[10,52,116],"resource-constrained":[11],"hardware,":[12],"but":[13],"aggressive":[14],"4-bit":[15],"significantly":[17],"degrades":[18],"generative":[19],"performance.":[20,37],"Low-rank":[21],"approximation":[22],"methods":[23,111],"have":[24],"emerged":[25],"as":[26,129],"a":[27,67,139,148],"promising":[28],"solution":[29],"by":[30],"appending":[31],"auxiliary":[32],"linear":[33],"branches":[34,44],"to":[35,97],"restore":[36],"However,":[38],"current":[39],"state-of-the-art":[40,110],"approaches":[41],"assume":[42],"these":[43],"must":[45],"retain":[46],"high":[47],"precision":[48],"(W16A16)":[49],"and":[50,118,132],"rely":[51],"heavy,":[53],"data-dependent":[54],"calibration":[55,70],"initialization.":[57],"We":[58,100,120],"challenge":[59],"both":[60],"limitations":[61],"with":[62,153],"LoRaQ":[63,84,107],"(Low-Rank":[64],"Approximated":[65],"Quantization),":[66],"simple,":[68],"data-free":[69],"approach":[71],"that":[72,126],"optimizes":[73],"error":[75],"compensation.":[76],"By":[77],"overcoming":[78],"the":[79,86,93,109,135],"need":[80],"high-precision":[82],"branches,":[83],"enables":[85],"first":[87],"fully":[88,149],"sub-16":[89],"bit":[90],"pipeline,":[91],"allowing":[92],"low-rank":[94,136],"branch":[95],"itself":[96],"be":[98],"quantized.":[99],"demonstrate":[101],"that,":[102],"at":[103],"equal":[104],"memory":[105],"overhead,":[106],"outperforms":[108],"in":[112],"their":[113],"native":[114],"implementations":[115],"Pixart-$\u03a3$":[117],"SANA.":[119],"also":[121],"analyze":[122],"mixed-precision":[123,155],"configurations,":[124],"showing":[125],"setups":[127],"such":[128],"W8A8,":[130],"W6A6,":[131],"W4A8":[133],"branch,":[137],"alongside":[138],"W4":[140],"main":[141],"layer,":[142],"yield":[143],"superior":[144],"results":[145],"while":[146],"maintaining":[147],"quantized":[150],"architecture":[151],"compatible":[152],"modern":[154],"hardware.":[156]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-22T00:00:00"}
