{"id":"https://openalex.org/W7138785421","doi":"https://doi.org/10.1609/aaai.v40i39.40608","title":"Put the Space of LoRA Initialization to the Extreme to Preserve Pre-trained Knowledge","display_name":"Put the Space of LoRA Initialization to the Extreme to Preserve Pre-trained Knowledge","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138785421","doi":"https://doi.org/10.1609/aaai.v40i39.40608"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i39.40608","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40608","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40608/44569","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40608/44569","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002276656","display_name":"Pengwei Tang","orcid":"https://orcid.org/0009-0000-9839-5570"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pengwei Tang","raw_affiliation_strings":["Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China,\nBeijing Key Laboratory of Research on Large Models and Intelligent Governance,\nEngineering Research Center of Next-Generation Intelligent Search and Recommendation, MOE,"],"affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China,\nBeijing Key Laboratory of Research on Large Models and Intelligent Governance,\nEngineering Research Center of Next-Generation Intelligent Search and Recommendation, MOE,","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129652440","display_name":"Xiaolin Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210094876","display_name":"Ministry of Education","ror":"https://ror.org/00q919b81","country_code":"SA","type":"government","lineage":["https://openalex.org/I4210094876"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Xiaolin Hu","raw_affiliation_strings":["Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University,"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen University,","institution_ids":["https://openalex.org/I4210094876"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129670613","display_name":"Yong Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Liu","raw_affiliation_strings":["Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China,\nBeijing Key Laboratory of Research on Large Models and Intelligent Governance,\nEngineering Research Center of Next-Generation Intelligent Search and Recommendation, MOE,"],"affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China,\nBeijing Key Laboratory of Research on Large Models and Intelligent Governance,\nEngineering Research Center of Next-Generation Intelligent Search and Recommendation, MOE,","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129695848","display_name":"Lizhong Ding","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lizhong Ding","raw_affiliation_strings":["Beijing Institute of Technology,"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology,","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129752148","display_name":"Dongjie Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I862669128","display_name":"Xiaomi (China)","ror":"https://ror.org/029f7bn57","country_code":"CN","type":"company","lineage":["https://openalex.org/I862669128"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongjie Zhang","raw_affiliation_strings":["Xiaohongshu Inc.,"],"affiliations":[{"raw_affiliation_string":"Xiaohongshu Inc.,","institution_ids":["https://openalex.org/I862669128"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129738975","display_name":"Xing Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xing Wu","raw_affiliation_strings":["Xiaohongshu Inc.,\nInstitute of Information Engineering, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Xiaohongshu Inc.,\nInstitute of Information Engineering, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129658529","display_name":"Debing Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I862669128","display_name":"Xiaomi (China)","ror":"https://ror.org/029f7bn57","country_code":"CN","type":"company","lineage":["https://openalex.org/I862669128"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Debing Zhang","raw_affiliation_strings":["Xiaohongshu Inc.,"],"affiliations":[{"raw_affiliation_string":"Xiaohongshu Inc.,","institution_ids":["https://openalex.org/I862669128"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5002276656"],"corresponding_institution_ids":["https://openalex.org/I4210100255"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70074946,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"39","first_page":"33232","last_page":"33240"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.6061000227928162,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.6061000227928162,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11029999703168869,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.07119999825954437,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.9544000029563904},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.560699999332428},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.5601999759674072},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5152999758720398},{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.42579999566078186},{"id":"https://openalex.org/keywords/prior-information","display_name":"Prior information","score":0.3269999921321869}],"concepts":[{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.9544000029563904},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6888999938964844},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.560699999332428},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.5601999759674072},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5152999758720398},{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.42579999566078186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32919999957084656},{"id":"https://openalex.org/C3020402766","wikidata":"https://www.wikidata.org/wiki/Q104376712","display_name":"Prior information","level":2,"score":0.3269999921321869},{"id":"https://openalex.org/C2777348039","wikidata":"https://www.wikidata.org/wiki/Q6423397","display_name":"Knowledge space","level":2,"score":0.32330000400543213},{"id":"https://openalex.org/C203763787","wikidata":"https://www.wikidata.org/wiki/Q371029","display_name":"Null (SQL)","level":2,"score":0.31200000643730164},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.30649998784065247},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30410000681877136},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.2888999879360199},{"id":"https://openalex.org/C148043351","wikidata":"https://www.wikidata.org/wiki/Q4456944","display_name":"Current (fluid)","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2621000111103058},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.260699987411499}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i39.40608","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40608","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40608/44569","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i39.40608","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40608","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/40608/44569","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5033180117607117}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138785421.pdf","grobid_xml":"https://content.openalex.org/works/W7138785421.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Low-Rank":[0],"Adaptation":[1],"(LoRA)":[2],"is":[3,64,71,84,96,190],"the":[4,59,79,82,91,97,105,114,125,135,144,153,163,170,185,217,229],"leading":[5],"parameter-efficient":[6],"fine-tuning":[7,238],"method":[8,212],"for":[9],"Large":[10],"Language":[11],"Models":[12],"(LLMs),":[13],"but":[14],"it":[15],"still":[16],"suffers":[17],"from":[18,162],"catastrophic":[19,31],"forgetting.":[20,32],"Recent":[21],"work":[22],"has":[23],"shown":[24],"that":[25,90,169,201,213,225],"specialized":[26],"LoRA":[27,39,62,94,115,215],"initialization":[28,40,63,95,116],"can":[29],"alleviate":[30],"There":[33],"are":[34,176],"currently":[35],"two":[36],"approaches":[37],"to":[38,53,66,76,99,119,132,200],"aimed":[41],"at":[42],"preventing":[43],"knowledge":[44,102,140,197,232],"forgetting":[45],"during":[46],"fine-tuning:":[47],"(1)":[48],"making":[49,113],"residual":[50,106],"weights":[51,158],"close":[52],"pre-trained":[54,67,101,120,129,133,139,157,182,196,230],"weights,":[55,134],"and":[56,193],"(2)":[57],"ensuring":[58],"space":[60,92,117,127,187,219],"of":[61,81,93,128,138,146,173,181,188,202,220,233],"orthogonal":[65,118],"knowledge.":[68],"The":[69],"former":[70],"what":[72],"current":[73,164],"methods":[74,109],"strive":[75],"achieve,":[77],"while":[78,156,235],"importance":[80],"latter":[83],"not":[85],"sufficiently":[86],"recognized.":[87],"We":[88],"find":[89,168],"key":[98],"preserving":[100],"rather":[103],"than":[104,179],"weights.":[107,121,130,183,203],"Existing":[108],"like":[110],"MiLoRA":[111,123],"propose":[112],"However,":[122],"utilizes":[124],"null":[126,186,218],"Compared":[131],"input":[136,154,174],"activations":[137,175,189],"take":[141],"into":[142],"account":[143],"parameters":[145],"all":[147],"previous":[148],"layers":[149],"as":[150,152,240],"well":[151],"data,":[155],"only":[159],"contain":[160],"information":[161,198],"layer.":[165],"Moreover,":[166],"we":[167,207],"effective":[171],"ranks":[172],"much":[177],"smaller":[178],"those":[180],"Thus,":[184],"more":[191],"accurate":[192],"contains":[194],"less":[195],"compared":[199],"Based":[204],"on":[205],"these,":[206],"introduce":[208],"LoRA-Null,":[209],"our":[210],"proposed":[211],"initializes":[214],"in":[216],"activations.":[221],"Experimental":[222],"results":[223],"show":[224],"LoRA-Null":[226],"effectively":[227],"preserves":[228],"world":[231],"LLMs":[234],"achieving":[236],"good":[237],"performance,":[239],"evidenced":[241],"by":[242],"extensive":[243],"experiments.":[244]},"counts_by_year":[],"updated_date":"2026-03-20T20:47:17.329874","created_date":"2026-03-18T00:00:00"}
