{"id":"https://openalex.org/W7138094579","doi":"https://doi.org/10.1609/aaai.v40i18.38589","title":"RoSA: Enhancing Parameter-Efficient Fine-Tuning via RoPE-aware Selective Adaptation in Large Language Models","display_name":"RoSA: Enhancing Parameter-Efficient Fine-Tuning via RoPE-aware Selective Adaptation in Large Language Models","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138094579","doi":"https://doi.org/10.1609/aaai.v40i18.38589"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v40i18.38589","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i18.38589","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38589/42551","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38589/42551","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017085160","display_name":"Dayan Pan","orcid":"https://orcid.org/0009-0008-7712-8658"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Dayan Pan","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129686737","display_name":"Jingyuan Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingyuan Wang","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China\nSchool of Economics and Management, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China\nSchool of Economics and Management, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129725697","display_name":"Yilong Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yilong Zhou","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129692954","display_name":"Jiawei Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]},{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Jiawei Cheng","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China\nDepartment of Data Science, City University of Hong Kong, Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China\nMOE Engineering Research Center of Advanced Computer Application Technology, Beihang University, China\nDepartment of Data Science, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I82880672","https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129676351","display_name":"Pengyue Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Pengyue Jia","raw_affiliation_strings":["Department of Data Science, City University of Hong Kong, Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Data Science, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129720509","display_name":"Xiangyu Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Xiangyu Zhao","raw_affiliation_strings":["Department of Data Science, City University of Hong Kong, Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Data Science, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I168719708"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5017085160"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28150262,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"18","first_page":"15600","last_page":"15608"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.38670000433921814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.38670000433921814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.10270000249147415,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.0786999985575676,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6287999749183655},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.6238999962806702},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.6230999827384949},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.48030000925064087},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.42980000376701355},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.36419999599456787},{"id":"https://openalex.org/keywords/selective-attention","display_name":"Selective attention","score":0.32350000739097595}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6988999843597412},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6287999749183655},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.6238999962806702},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.6230999827384949},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5457000136375427},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.48030000925064087},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.42980000376701355},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.36419999599456787},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3287999927997589},{"id":"https://openalex.org/C2989146674","wikidata":"https://www.wikidata.org/wiki/Q4818236","display_name":"Selective attention","level":3,"score":0.32350000739097595},{"id":"https://openalex.org/C2777617010","wikidata":"https://www.wikidata.org/wiki/Q18957","display_name":"Mainstream","level":2,"score":0.3231000006198883},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.31529998779296875},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.31360000371932983},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2870999872684479},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1609/aaai.v40i18.38589","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i18.38589","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38589/42551","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:ojs.aaai.org:article/38589","is_oa":false,"landing_page_url":"https://ojs.aaai.org/index.php/AAAI/article/view/38589","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2159-5399","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i18.38589","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i18.38589","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38589/42551","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1467331575","display_name":null,"funder_award_id":"72242101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2363765612","display_name":null,"funder_award_id":"72171013","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8299714314","display_name":null,"funder_award_id":"9229503","funder_id":"https://openalex.org/F4320309893","funder_display_name":"City University of Hong Kong"},{"id":"https://openalex.org/G8651611484","display_name":null,"funder_award_id":"72222022","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320307285","display_name":"Impact Fund","ror":"https://ror.org/00jb20j87"},{"id":"https://openalex.org/F4320309893","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23"},{"id":"https://openalex.org/F4320316083","display_name":"Tencent","ror":"https://ror.org/00hhjss72"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138094579.pdf","grobid_xml":"https://content.openalex.org/works/W7138094579.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Fine-tuning":[0],"large":[1],"language":[2],"models":[3],"is":[4],"essential":[5],"for":[6],"task-specific":[7],"adaptation,":[8,129],"yet":[9],"it":[10],"remains":[11],"computationally":[12],"prohibitive.":[13],"Parameter-Efficient":[14],"Fine-Tuning":[15],"(PEFT)":[16],"methods":[17,151],"have":[18],"emerged":[19],"as":[20],"a":[21,69,78,86,103],"solution,":[22],"but":[23],"current":[24],"approaches":[25],"typically":[26],"ignore":[27],"the":[28,35,46,57,95,114],"distinct":[29],"roles":[30],"of":[31,60,98],"model":[32],"components":[33,97],"and":[34,81,102,112,134,142],"heterogeneous":[36],"importance":[37],"across":[38],"layers,":[39],"thereby":[40],"limiting":[41],"adaptation":[42],"efficiency.":[43],"Motivated":[44],"by":[45],"observation":[47],"that":[48,73,109,146],"Rotary":[49],"Position":[50],"Embeddings":[51],"(RoPE)":[52],"induce":[53],"critical":[54,116],"activations":[55],"in":[56,77],"low-frequency":[58,96],"dimensions":[59],"attention":[61,100],"states,":[62,101],"we":[63],"propose":[64],"RoPE-aware":[65,87],"Selective":[66],"Adaptation":[67],"(RoSA),":[68],"novel":[70],"PEFT":[71,150],"framework":[72],"allocates":[74],"trainable":[75,154],"parameters":[76],"more":[79,132],"targeted":[80,133],"effective":[82],"manner.":[83],"RoSA":[84,130,147],"comprises":[85],"Attention":[88],"Enhancement":[89],"(RoAE)":[90],"module,":[91],"which":[92],"selectively":[93],"enhances":[94],"RoPE-influenced":[99],"Dynamic":[104],"Layer":[105],"Selection":[106],"(DLS)":[107],"strategy":[108],"adaptively":[110],"identifies":[111],"updates":[113],"most":[115],"layers":[117],"based":[118],"on":[119,139],"LayerNorm":[120],"gradient":[121],"norms.":[122],"By":[123],"combining":[124],"dimension-wise":[125],"enhancement":[126],"with":[127],"layer-wise":[128],"achieves":[131],"efficient":[135],"fine-tuning.":[136],"Extensive":[137],"experiments":[138],"fifteen":[140],"commonsense":[141],"arithmetic":[143],"benchmarks":[144],"demonstrate":[145],"outperforms":[148],"mainstream":[149],"under":[152],"comparable":[153],"parameters.":[155]},"counts_by_year":[],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2026-03-18T00:00:00"}
