{"id":"https://openalex.org/W4402592728","doi":"https://doi.org/10.1109/taslp.2024.3463395","title":"Bayesian Parameter-Efficient Fine-Tuning for Overcoming Catastrophic Forgetting","display_name":"Bayesian Parameter-Efficient Fine-Tuning for Overcoming Catastrophic Forgetting","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402592728","doi":"https://doi.org/10.1109/taslp.2024.3463395"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2024.3463395","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/taslp.2024.3463395","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"http://dx.doi.org/10.1109/taslp.2024.3463395","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048969380","display_name":"Haolin Chen","orcid":"https://orcid.org/0009-0005-0230-8169"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Haolin Chen","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081808619","display_name":"Philip N. Garner","orcid":"https://orcid.org/0000-0002-0814-1348"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Philip N. Garner","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5048969380"],"corresponding_institution_ids":["https://openalex.org/I7495430"],"apc_list":null,"apc_paid":null,"fwci":0.2624,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53527617,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"32","issue":null,"first_page":"4253","last_page":"4262"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9714000225067139,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9343000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.841280460357666},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.6315762996673584},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4179893732070923},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28926289081573486},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1846010684967041},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.14991697669029236}],"concepts":[{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.841280460357666},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.6315762996673584},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4179893732070923},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28926289081573486},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1846010684967041},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.14991697669029236}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2024.3463395","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/taslp.2024.3463395","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:infoscience.epfl.ch:20.500.14299/245710","is_oa":true,"landing_page_url":"https://infoscience.epfl.ch/handle/20.500.14299/245710","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"research article"}],"best_oa_location":{"id":"doi:10.1109/taslp.2024.3463395","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/taslp.2024.3463395","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Climate action","id":"https://metadata.un.org/sdg/13","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W2060277733","https://openalex.org/W2111051539","https://openalex.org/W2153914468","https://openalex.org/W2560647685","https://openalex.org/W2963748441","https://openalex.org/W2963846996","https://openalex.org/W2972359262","https://openalex.org/W2979826702","https://openalex.org/W3021931813","https://openalex.org/W3024869864","https://openalex.org/W3025844872","https://openalex.org/W3101498587","https://openalex.org/W3176828726","https://openalex.org/W3206816211","https://openalex.org/W4205991051","https://openalex.org/W4312210066","https://openalex.org/W4312933868","https://openalex.org/W4381786045","https://openalex.org/W4385569970","https://openalex.org/W4385570973","https://openalex.org/W4387941762","https://openalex.org/W4389520299","https://openalex.org/W4391833199","https://openalex.org/W6631190155","https://openalex.org/W6639024717","https://openalex.org/W6683107984","https://openalex.org/W6691459498","https://openalex.org/W6727099177","https://openalex.org/W6739785051","https://openalex.org/W6741217325","https://openalex.org/W6748278106","https://openalex.org/W6748453816","https://openalex.org/W6748588790","https://openalex.org/W6750615492","https://openalex.org/W6752294818","https://openalex.org/W6752540598","https://openalex.org/W6759579507","https://openalex.org/W6772349387","https://openalex.org/W6772650050","https://openalex.org/W6778883912","https://openalex.org/W6782104728","https://openalex.org/W6788175385","https://openalex.org/W6796581206","https://openalex.org/W6796823589","https://openalex.org/W6797067896","https://openalex.org/W6802744804","https://openalex.org/W6802833136","https://openalex.org/W6811340617","https://openalex.org/W6837789219","https://openalex.org/W6838639034","https://openalex.org/W6848221137","https://openalex.org/W6848735303","https://openalex.org/W6852246195","https://openalex.org/W6852811169","https://openalex.org/W6853937136","https://openalex.org/W6856154222","https://openalex.org/W6857244322","https://openalex.org/W6858637263","https://openalex.org/W6859583170"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W4289718052","https://openalex.org/W2164121020","https://openalex.org/W2145559838","https://openalex.org/W2905319430","https://openalex.org/W3116498279","https://openalex.org/W4287549553","https://openalex.org/W4310285384","https://openalex.org/W3183027292"],"abstract_inverted_index":{"We":[0,42],"are":[1],"motivated":[2],"primarily":[3],"by":[4,120],"the":[5,37,61,65,99,125,130,138,142],"adaptation":[6,101],"of":[7,64,76,137],"text-to-speech":[8],"synthesis":[9,83],"models;":[10],"however":[11],"we":[12,85],"argue":[13],"that":[14,44,114],"more":[15],"generic":[16],"parameter-efficient":[17],"fine-tuning":[18,126],"(PEFT)":[19],"is":[20],"an":[21,32],"appropriate":[22],"framework":[23],"to":[24,52,54,95],"do":[25],"such":[26],"adaptation.":[27],"Nevertheless,":[28],"catastrophic":[29,56,115],"forgetting":[30,57,116],"remains":[31],"issue":[33],"with":[34,98],"PEFT,":[35],"damaging":[36],"pre-trained":[38],"model's":[39],"inherent":[40],"capabilities.":[41],"demonstrate":[43,113],"existing":[45],"Bayesian":[46],"learning":[47],"techniques":[48],"can":[49,68,117],"be":[50,69,118],"applied":[51],"PEFT":[53,97],"prevent":[55],"as":[58,60],"long":[59],"parameter":[62],"shift":[63],"fine-tuned":[66],"layers":[67],"calculated":[70],"differentiably.":[71],"In":[72],"a":[73,134],"principled":[74],"series":[75],"experiments":[77],"on":[78],"language":[79],"modeling":[80],"and":[81,92,103,128],"speech":[82],"tasks,":[84],"utilize":[86],"established":[87],"Laplace":[88],"approximations,":[89],"including":[90],"diagonal":[91,143],"Kronecker-factored":[93,131],"approaches,":[94],"regularize":[96],"low-rank":[100],"(LoRA)":[102],"compare":[104],"their":[105],"performance":[106],"in":[107],"pre-training":[108,139],"knowledge":[109,140],"preservation.":[110],"Our":[111],"results":[112],"overcome":[119],"our":[121],"methods":[122],"without":[123],"degrading":[124],"performance,":[127],"using":[129],"approximation":[132],"produces":[133],"better":[135],"preservation":[136],"than":[141],"ones.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
