{"id":"https://openalex.org/W7127297662","doi":"https://doi.org/10.48550/arxiv.2602.00942","title":"SALAAD: Sparse And Low-Rank Adaptation via ADMM for Large Language Model Inference","display_name":"SALAAD: Sparse And Low-Rank Adaptation via ADMM for Large Language Model Inference","publication_year":2026,"publication_date":"2026-02-01","ids":{"openalex":"https://openalex.org/W7127297662","doi":"https://doi.org/10.48550/arxiv.2602.00942"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.00942","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124960171","display_name":"Hao Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ma, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124912374","display_name":"Melis Ilayda Bal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bal, Melis Ilayda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124881050","display_name":"Liang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Liang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057208641","display_name":"Bingcong Li","orcid":"https://orcid.org/0000-0003-1958-4168"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Bingcong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124887017","display_name":"Niao He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Niao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037513714","display_name":"Melanie N. Zeilinger","orcid":"https://orcid.org/0000-0003-4570-7571"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeilinger, Melanie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049845074","display_name":"Michael Muehlebach","orcid":"https://orcid.org/0000-0002-7764-3069"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muehlebach, Michael","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5124960171"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.29840001463890076,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.29840001463890076,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.225600004196167,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.08839999884366989,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5687000155448914},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5636000037193298},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5455999970436096},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5260000228881836},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5156000256538391},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5070000290870667},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.4113999903202057},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3917999863624573}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7498999834060669},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5687000155448914},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5636000037193298},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5455999970436096},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5260000228881836},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5156000256538391},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5070000290870667},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.4113999903202057},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3917999863624573},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3856000006198883},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.374099999666214},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.3734999895095825},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.3483000099658966},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.31360000371932983},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29760000109672546},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.29499998688697815},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.2879999876022339},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.27300000190734863},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.25360000133514404},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2535000145435333}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.00942","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.00942","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.00942","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.00942","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modern":[0],"large":[1],"language":[2],"models":[3],"are":[4],"increasingly":[5],"deployed":[6],"under":[7,74],"compute":[8],"and":[9,23,30,42,64,79,90,148],"memory":[10,123,153],"constraints,":[11,92],"making":[12],"flexible":[13],"control":[14,104],"of":[15,97,108,143],"model":[16,59,110,116,144],"capacity":[17,29,111],"a":[18,53,135,140],"central":[19],"challenge.":[20],"While":[21],"sparse":[22,63],"low-rank":[24,65],"structures":[25,66],"naturally":[26],"trade":[27],"off":[28],"performance,":[31],"existing":[32],"approaches":[33],"often":[34],"rely":[35],"on":[36],"heuristic":[37],"designs":[38],"that":[39,61,84,119],"ignore":[40],"layer":[41],"matrix":[43],"heterogeneity":[44],"or":[45],"require":[46],"model-specific":[47],"architectural":[48],"modifications.":[49],"We":[50],"propose":[51],"SALAAD,":[52],"plug-and-play":[54],"framework":[55,78],"applicable":[56],"to":[57,131],"different":[58],"architectures":[60],"induces":[62],"during":[67,112,125],"training.":[68,113],"By":[69],"formulating":[70],"structured":[71],"weight":[72],"learning":[73],"an":[75,81],"augmented":[76],"Lagrangian":[77],"introducing":[80],"adaptive":[82],"controller":[83],"dynamically":[85],"balances":[86],"the":[87,95,106,156],"training":[88,99,137],"loss":[89],"structural":[91],"SALAAD":[93,120],"preserves":[94],"stability":[96],"standard":[98],"dynamics":[100],"while":[101,127],"enabling":[102,146],"explicit":[103],"over":[105],"evolution":[107],"effective":[109],"Experiments":[114],"across":[115,151],"scales":[117],"show":[118],"substantially":[121],"reduces":[122],"consumption":[124],"deployment":[126,150],"achieving":[128],"performance":[129],"comparable":[130],"ad-hoc":[132],"methods.":[133],"Moreover,":[134],"single":[136],"run":[138],"yields":[139],"continuous":[141],"spectrum":[142],"capacities,":[145],"smooth":[147],"elastic":[149],"diverse":[152],"budgets":[154],"without":[155],"need":[157],"for":[158],"retraining.":[159]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-04T00:00:00"}
