{"id":"https://openalex.org/W4398795071","doi":"https://doi.org/10.48550/arxiv.2405.13155","title":"ReALLM: A general framework for LLM compression and fine-tuning","display_name":"ReALLM: A general framework for LLM compression and fine-tuning","publication_year":2024,"publication_date":"2024-05-21","ids":{"openalex":"https://openalex.org/W4398795071","doi":"https://doi.org/10.48550/arxiv.2405.13155"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2405.13155","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.13155","pdf_url":"https://arxiv.org/pdf/2405.13155","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.13155","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041480387","display_name":"Louis Leconte","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Leconte, Louis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104228506","display_name":"Lisa Bedin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bedin, Lisa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100777903","display_name":"Van Minh Nguyen","orcid":"https://orcid.org/0000-0001-6475-6163"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Van Minh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101398712","display_name":"\u00c9ric Moulines","orcid":"https://orcid.org/0000-0002-2058-0693"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moulines, Eric","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5041480387"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9490000009536743,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9490000009536743,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.5751357674598694},{"id":"https://openalex.org/keywords/fine-tuning","display_name":"Fine-tuning","score":0.4373193681240082},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3941836655139923},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.27004122734069824},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11969000101089478},{"id":"https://openalex.org/keywords/composite-material","display_name":"Composite material","score":0.04950115084648132}],"concepts":[{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.5751357674598694},{"id":"https://openalex.org/C157524613","wikidata":"https://www.wikidata.org/wiki/Q2828883","display_name":"Fine-tuning","level":2,"score":0.4373193681240082},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3941836655139923},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.27004122734069824},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11969000101089478},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.04950115084648132},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2405.13155","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.13155","pdf_url":"https://arxiv.org/pdf/2405.13155","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2405.13155","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2405.13155","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.13155","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.13155","pdf_url":"https://arxiv.org/pdf/2405.13155","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4398795071.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"We":[0],"introduce":[1],"ReALLM,":[2],"a":[3,26,36,41,90,97,111,118,141,150,163],"novel":[4],"approach":[5],"for":[6,25,140],"compression":[7],"and":[8,22,40,96,117,138],"memory-efficient":[9],"adaptation":[10],"of":[11,18,28,71,110,143,152],"pre-trained":[12,62],"language":[13,134],"models":[14],"that":[15,61],"encompasses":[16],"most":[17],"the":[19,49,53,69,72,123,130],"post-training":[20],"quantization":[21,127],"fine-tuning":[23,50,161],"methods":[24],"budget":[27,142,151],"&lt;4":[29],"bits.":[30,107],"Pre-trained":[31],"matrices":[32,63],"are":[33,56],"decomposed":[34],"into":[35],"high-precision":[37],"low-rank":[38,54],"component":[39],"vector-quantized":[42],"latent":[43],"representation":[44],"(using":[45],"an":[46],"autoencoder).":[47],"During":[48],"step,":[51],"only":[52,114],"components":[55],"updated.":[57],"Our":[58,125],"results":[59,132],"show":[60],"exhibit":[64],"different":[65],"patterns.":[66],"ReALLM":[67,83,155],"adapts":[68],"shape":[70],"encoder":[73],"(small/large":[74],"embedding,":[75],"high/low":[76],"bit":[77],"VQ,":[78],"etc.)":[79],"to":[80,85],"each":[81,87],"matrix.":[82],"proposes":[84],"represent":[86],"matrix":[88,112],"with":[89,102,122],"small":[91,164],"embedding":[92,116],"on":[93,105,133,162],"$b$":[94],"bits":[95,145],"neural":[98],"decoder":[99],"model":[100],"$\\mathcal{D}_\u03d5$":[101],"its":[103],"weights":[104],"$b_\u03d5$":[106],"The":[108],"decompression":[109],"requires":[113],"one":[115],"single":[119],"forward":[120],"pass":[121],"decoder.":[124],"weight-only":[126],"algorithm":[128],"yields":[129],"best":[131],"generation":[135],"tasks":[136],"(C4":[137],"WikiText-2)":[139],"$3$":[144],"without":[146],"any":[147],"training.":[148],"With":[149],"$2$":[153],"bits,":[154],"achieves":[156],"state-of-the":[157],"art":[158],"performance":[159],"after":[160],"calibration":[165],"dataset.":[166]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
