{"id":"https://openalex.org/W7140123693","doi":"https://doi.org/10.18653/v1/2026.findings-eacl.156","title":"FLAT-LLM: Fine-grained Low-rank Activation Space Transformation for Large Language Model Compression","display_name":"FLAT-LLM: Fine-grained Low-rank Activation Space Transformation for Large Language Model Compression","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7140123693","doi":"https://doi.org/10.18653/v1/2026.findings-eacl.156"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2026.findings-eacl.156","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.findings-eacl.156","pdf_url":"https://aclanthology.org/2026.findings-eacl.156.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: EACL 2026","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2026.findings-eacl.156.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jiayi Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiayi Tian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ryan Solgi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ryan Solgi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jinming Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jinming Lu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yifan Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yifan Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Hai Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hai Li","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Zheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng Zhang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":19.5563,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.98802151,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2988","last_page":"3002"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.21089999377727509,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.21089999377727509,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.16179999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08470000326633453,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.4706000089645386},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.40540000796318054},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.38510000705718994},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.3659000098705292}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5091000199317932},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.4706000089645386},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.40540000796318054},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4041000008583069},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.38510000705718994},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.3659000098705292},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.31859999895095825},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28839999437332153},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2572999894618988}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2026.findings-eacl.156","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.findings-eacl.156","pdf_url":"https://aclanthology.org/2026.findings-eacl.156.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: EACL 2026","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2026.findings-eacl.156","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.findings-eacl.156","pdf_url":"https://aclanthology.org/2026.findings-eacl.156.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: EACL 2026","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7140123693.pdf","grobid_xml":"https://content.openalex.org/works/W7140123693.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"enabled":[5],"remarkable":[6],"progress":[7],"in":[8,23,48,75,139],"natural":[9],"language":[10],"processing,":[11],"yet":[12],"their":[13],"high":[14],"computational":[15],"and":[16,46,64,97,112,131,141],"memory":[17],"demands":[18],"pose":[19],"challenges":[20],"for":[21,34],"deployment":[22],"resource-constrained":[24],"environments.Although":[25],"recent":[26],"low-rank":[27,73],"decomposition":[28],"methods":[29],"offer":[30],"a":[31,62,99,125],"promising":[32],"path":[33],"structural":[35,67,136],"compression,":[36],"they":[37],"often":[38],"suffer":[39],"from":[40],"accuracy":[41],"degradation,":[42],"expensive":[43],"calibration":[44,123],"procedures,":[45],"result":[47],"inefficient":[49],"model":[50],"architectures":[51],"that":[52],"hinder":[53],"real-world":[54],"inference":[55,146],"speedups.In":[56],"this":[57],"paper,":[58],"we":[59,79],"propose":[60],"FLAT-LLM,":[61],"fast":[63],"accurate,":[65],"training-free":[66],"compression":[68,115],"method":[69],"based":[70],"on":[71],"fine-grained":[72],"transformations":[74],"the":[76,81,86,122],"activation":[77],"space.Specifically,":[78],"reduce":[80],"hidden":[82],"dimension":[83],"by":[84],"transforming":[85],"weights":[87],"using":[88],"truncated":[89],"eigenvectors":[90],"computed":[91],"via":[92],"head-wise":[93],"Principal":[94],"Component":[95],"Analysis,":[96],"employ":[98],"greedy":[100],"budget":[101],"redistribution":[102],"strategy":[103],"to":[104],"adaptively":[105],"allocate":[106],"ranks":[107],"across":[108,128],"decoders.FLAT-LLM":[109],"achieves":[110],"efficient":[111],"effective":[113],"weight":[114],"without":[116],"recovery":[117],"fine-tuning,":[118],"which":[119],"could":[120],"complete":[121],"within":[124],"few":[126],"minutes.Evaluated":[127],"5":[129],"models":[130],"11":[132],"datasets,":[133],"FLAT-LLM":[134],"outperforms":[135],"pruning":[137],"baselines":[138],"generalization":[140],"downstream":[142],"performance,":[143],"while":[144],"delivering":[145],"speedups":[147],"over":[148],"low-rankbased":[149],"methods.":[150],"1":[151]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-11T00:00:00"}
