{"id":"https://openalex.org/W4402671248","doi":"https://doi.org/10.18653/v1/2024.acl-short.16","title":"AFLoRA: Adaptive Freezing of Low Rank Adaptation in Parameter Efficient Fine-Tuning of Large Models","display_name":"AFLoRA: Adaptive Freezing of Low Rank Adaptation in Parameter Efficient Fine-Tuning of Large Models","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402671248","doi":"https://doi.org/10.18653/v1/2024.acl-short.16"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2024.acl-short.16","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.acl-short.16","pdf_url":"https://aclanthology.org/2024.acl-short.16.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2024.acl-short.16.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015708634","display_name":"Zeyu Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zeyu Liu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087095284","display_name":"Souvik Kundu","orcid":"https://orcid.org/0000-0001-5815-8765"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Souvik Kundu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086133855","display_name":"Anni Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anni Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101321562","display_name":"Junrui Wan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junrui Wan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113149227","display_name":"Lianghao Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lianghao Jiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084205024","display_name":"Peter A. Beerel","orcid":"https://orcid.org/0000-0002-8283-0168"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peter Beerel","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5015708634"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.1615,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.89352606,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"161","last_page":"167"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9498000144958496,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9498000144958496,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9386000037193298,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.907800018787384,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.7387410402297974},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5981455445289612},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5577102899551392},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.40877819061279297},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3392822742462158},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24819394946098328},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.21928200125694275},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.17667105793952942},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.0712791383266449},{"id":"https://openalex.org/keywords/optics","display_name":"Optics","score":0.06288880109786987},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.05399349331855774}],"concepts":[{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.7387410402297974},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5981455445289612},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5577102899551392},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.40877819061279297},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3392822742462158},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24819394946098328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.21928200125694275},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.17667105793952942},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.0712791383266449},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.06288880109786987},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.05399349331855774},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2024.acl-short.16","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.acl-short.16","pdf_url":"https://aclanthology.org/2024.acl-short.16.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2024.acl-short.16","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.acl-short.16","pdf_url":"https://aclanthology.org/2024.acl-short.16.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5099999904632568,"id":"https://metadata.un.org/sdg/13","display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4402671248.pdf","grobid_xml":"https://content.openalex.org/works/W4402671248.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,25,33,45,50],"novel":[3,51],"parameter-efficient":[4],"finetuning":[5],"(PEFT)":[6],"method,":[7],"dubbed":[8],"as":[9,87,116],"adaptive":[10],"freezing":[11,52,143],"of":[12,28,40,83,107,125,135],"low":[13],"rank":[14],"adaptation":[15],"(AFLoRA).Specifically,":[16],"for":[17,145],"each":[18,39],"pre-trained":[19],"frozen":[20],"weight":[21],"tensor,":[22],"we":[23,54,74,128],"add":[24],"parallel":[26],"path":[27],"trainable":[29,102],"low-rank":[30],"matrices,":[31],"namely":[32],"down-projection":[34],"and":[35,67,92,141],"an":[36,80],"up-projection":[37],"matrix,":[38],"which":[41],"is":[42],"followed":[43],"by":[44],"feature":[46],"transformation":[47],"vector.Based":[48],"on":[49,89,131],"score,":[53],"then":[55],"incrementally":[56],"freeze":[57],"these":[58],"projection":[59,148],"matrices":[60],"during":[61],"fine-tuning":[62],"to":[63,85,98,113,118],"reduce":[64],"the":[65,90,122,132,142,146],"computation":[66],"alleviate":[68],"over-fitting.Our":[69],"experimental":[70],"results":[71],"demonstrate":[72],"that":[73],"can":[75,110],"achieve":[76],"state-of-theart":[77],"performance":[78],"with":[79],"average":[81,101],"improvement":[82,115],"up":[84,97,112],"1.09%":[86],"evaluated":[88],"GLUE":[91],"GSM8k":[93],"benchmark":[94],"while":[95],"yielding":[96],"9.5":[99],"fewer":[100],"parameters.While":[103],"compared":[104],"in":[105],"terms":[106],"runtime,":[108],"AFLoRA":[109],"yield":[111],"1.86":[114],"opposed":[117],"similar":[119],"PEFT":[120],"alternatives.Besides":[121],"practical":[123],"utility":[124],"our":[126],"approach,":[127],"provide":[129],"insights":[130],"trainability":[133],"requirements":[134],"LoRA":[136],"paths":[137],"at":[138],"different":[139,147],"modules":[140],"schedule":[144],"matrices.":[149]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-10-10T00:00:00"}
