{"id":"https://openalex.org/W7127715919","doi":"https://doi.org/10.48550/arxiv.2602.02848","title":"Zero Sum SVD: Balancing Loss Sensitivity for Low Rank LLM Compression","display_name":"Zero Sum SVD: Balancing Loss Sensitivity for Low Rank LLM Compression","publication_year":2026,"publication_date":"2026-02-02","ids":{"openalex":"https://openalex.org/W7127715919","doi":"https://doi.org/10.48550/arxiv.2602.02848"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.02848","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124998685","display_name":"Ali Abbasi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Abbasi, Ali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093329996","display_name":"Chayne Thrash","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thrash, Chayne","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101558909","display_name":"Haoran Qin","orcid":"https://orcid.org/0009-0008-4784-0943"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Haoran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125091144","display_name":"Shansita Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Shansita","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088963709","display_name":"Sepehr Seifi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seifi, Sepehr","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Kolouri, Soheil","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kolouri, Soheil","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5124998685"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.6723999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.6723999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.02410000003874302,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.02199999988079071,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.6887000203132629},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.6118999719619751},{"id":"https://openalex.org/keywords/sensitivity","display_name":"Sensitivity (control systems)","score":0.5964999794960022},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.5527999997138977},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5174999833106995},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5167999863624573},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4999000132083893},{"id":"https://openalex.org/keywords/homogeneous","display_name":"Homogeneous","score":0.46630001068115234},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4472000002861023}],"concepts":[{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.6887000203132629},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.6118999719619751},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6044999957084656},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5989000201225281},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.5964999794960022},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.5527999997138977},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5174999833106995},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5167999863624573},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4999000132083893},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.46630001068115234},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4472000002861023},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.42179998755455017},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.38760000467300415},{"id":"https://openalex.org/C90199385","wikidata":"https://www.wikidata.org/wiki/Q6692777","display_name":"Low-rank approximation","level":3,"score":0.37959998846054077},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3626999855041504},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.3513999879360199},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.32670000195503235},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.31540000438690186},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.265500009059906},{"id":"https://openalex.org/C2988416141","wikidata":"https://www.wikidata.org/wiki/Q6031139","display_name":"Information loss","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.2587999999523163},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C2778459887","wikidata":"https://www.wikidata.org/wiki/Q6787865","display_name":"Matrix completion","level":3,"score":0.251800000667572},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.02848","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.02848","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.02848","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.02848","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Advances":[0],"in":[1,59,97],"large":[2,57],"language":[3],"models":[4],"have":[5],"driven":[6],"strong":[7],"performance":[8,34],"across":[9,103,164,171],"many":[10],"tasks,":[11],"but":[12],"their":[13],"memory":[14],"and":[15,25,92,174],"compute":[16],"costs":[17],"still":[18],"hinder":[19],"deployment.":[20],"SVD-based":[21],"compression":[22,44,175],"reduces":[23],"storage":[24],"can":[26],"speed":[27],"up":[28],"inference":[29],"via":[30],"low-rank":[31],"factors,":[32],"yet":[33],"depends":[35],"on":[36,64],"how":[37],"rank":[38,128,141],"is":[39,178],"allocated":[40],"under":[41],"a":[42,80,108,127,152],"global":[43],"ratio.":[45],"Prior":[46],"methods":[47],"often":[48],"use":[49],"homogeneous":[50],"ranks":[51,124],"for":[52],"similarly":[53],"sized":[54],"matrices,":[55],"despite":[56],"differences":[58],"loss":[60,95,117],"sensitivity,":[61],"or":[62],"rely":[63],"expensive":[65],"iterative":[66],"pre-truncation":[67],"optimization":[68],"to":[69],"determine":[70],"per":[71],"matrix":[72],"ranks.":[73],"We":[74],"propose":[75],"\\textbf{Zero":[76],"Sum":[77],"SVD}":[78],"(\\textbf{ZS-SVD}),":[79],"post-training":[81],"method":[82],"that":[83,112,134,150],"performs":[84],"\\emph{global}":[85],"singular":[86],"component":[87],"selection":[88],"using":[89],"activation":[90],"whitening":[91],"first-order":[93],"calibration":[94],"estimates":[96],"whitened":[98],"coordinates.":[99],"\\textbf{ZS-SVD}":[100],"prunes":[101],"components":[102],"the":[104,114],"whole":[105],"model":[106],"with":[107],"\\textbf{zero":[109],"sum}":[110],"rule":[111],"keeps":[113],"cumulative":[115],"predicted":[116],"change":[118],"near":[119,136],"zero,":[120],"automatically":[121],"yielding":[122],"heterogeneous":[123],"without":[125],"solving":[126],"allocation":[129],"optimization.":[130],"Motivated":[131],"by":[132,160],"evidence":[133],"gradients":[135],"pretrained":[137],"solutions":[138],"exhibit":[139],"low":[140],"structure,":[142],"we":[143],"also":[144],"introduce":[145],"an":[146],"optional":[147],"lightweight":[148],"correction":[149],"applies":[151],"\\textbf{single}":[153],"projected":[154],"gradient":[155],"update":[156],"after":[157],"truncation,":[158],"followed":[159],"re-truncation.":[161],"Extensive":[162],"experiments":[163],"multiple":[165],"LLM":[166],"architectures":[167],"show":[168],"consistent":[169],"gains":[170],"diverse":[172],"benchmarks":[173],"ratios.":[176],"Code":[177],"available":[179],"at":[180],"https://github.com/mint-vu/Zero-Sum-SVD":[181]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-06T00:00:00"}
