{"id":"https://openalex.org/W4385573887","doi":"https://doi.org/10.18653/v1/2022.emnlp-main.540","title":"When does Parameter-Efficient Transfer Learning Work for Machine Translation?","display_name":"When does Parameter-Efficient Transfer Learning Work for Machine Translation?","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4385573887","doi":"https://doi.org/10.18653/v1/2022.emnlp-main.540"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2022.emnlp-main.540","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2022.emnlp-main.540","pdf_url":"https://aclanthology.org/2022.emnlp-main.540.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2022.emnlp-main.540.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063061204","display_name":"Ahmet \u00dcst\u00fcn","orcid":"https://orcid.org/0000-0002-1640-4291"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]},{"id":"https://openalex.org/I169381384","display_name":"University of Groningen","ror":"https://ror.org/012p63287","country_code":"NL","type":"education","lineage":["https://openalex.org/I169381384"]}],"countries":["GB","NL"],"is_corresponding":false,"raw_author_name":"Ahmet \u00dcst\u00fcn","raw_affiliation_strings":["University of Edinburgh","University of Groningen"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"University of Groningen","institution_ids":["https://openalex.org/I169381384"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024678824","display_name":"Asa Cooper Stickland","orcid":null},"institutions":[{"id":"https://openalex.org/I169381384","display_name":"University of Groningen","ror":"https://ror.org/012p63287","country_code":"NL","type":"education","lineage":["https://openalex.org/I169381384"]},{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB","NL"],"is_corresponding":true,"raw_author_name":"Asa Cooper Stickland","raw_affiliation_strings":["University of Edinburgh","University of Groningen"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"University of Groningen","institution_ids":["https://openalex.org/I169381384"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5024678824"],"corresponding_institution_ids":["https://openalex.org/I169381384","https://openalex.org/I98677209"],"apc_list":null,"apc_paid":null,"fwci":0.1388,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.58881884,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"7919","last_page":"7933"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7396964430809021},{"id":"https://openalex.org/keywords/fine-tuning","display_name":"Fine-tuning","score":0.7250446677207947},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.6654086112976074},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5902321934700012},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5439417958259583},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.5414888858795166},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5362282395362854},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4641401171684265},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4248994290828705},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37750372290611267},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08036458492279053}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7396964430809021},{"id":"https://openalex.org/C157524613","wikidata":"https://www.wikidata.org/wiki/Q2828883","display_name":"Fine-tuning","level":2,"score":0.7250446677207947},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.6654086112976074},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5902321934700012},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5439417958259583},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.5414888858795166},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5362282395362854},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4641401171684265},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4248994290828705},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37750372290611267},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08036458492279053},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2022.emnlp-main.540","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2022.emnlp-main.540","pdf_url":"https://aclanthology.org/2022.emnlp-main.540.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2022.emnlp-main.540","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2022.emnlp-main.540","pdf_url":"https://aclanthology.org/2022.emnlp-main.540.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1934935867","display_name":null,"funder_award_id":"Engineering and Physical Sciences R","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G342899402","display_name":null,"funder_award_id":"16427","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3603589064","display_name":null,"funder_award_id":"EP/L016427/1)","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G4437068315","display_name":"EPSRC Centre for Doctoral Training in Data Science","funder_award_id":"EP/L016427/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5288895031","display_name":null,"funder_award_id":"EPSRC Centre for Doctoral Training","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6244725262","display_name":null,"funder_award_id":"Centre for Doctoral Training","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6653872853","display_name":null,"funder_award_id":"EP/L016","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320320332","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90"},{"id":"https://openalex.org/F4320320933","display_name":"Rijksuniversiteit Groningen","ror":"https://ror.org/012p63287"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320337373","display_name":"Center for Information Technology","ror":"https://ror.org/03jh5a977"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385573887.pdf"},"referenced_works_count":52,"referenced_works":["https://openalex.org/W630532510","https://openalex.org/W1522301498","https://openalex.org/W2184135559","https://openalex.org/W2250342921","https://openalex.org/W2739967986","https://openalex.org/W2744813330","https://openalex.org/W2805394970","https://openalex.org/W2887920589","https://openalex.org/W2933138175","https://openalex.org/W2952468927","https://openalex.org/W2958953787","https://openalex.org/W2962863357","https://openalex.org/W2963088995","https://openalex.org/W2963250244","https://openalex.org/W2963532001","https://openalex.org/W2964085268","https://openalex.org/W2964303773","https://openalex.org/W2970925270","https://openalex.org/W3001434439","https://openalex.org/W3093517588","https://openalex.org/W3093871477","https://openalex.org/W3096966601","https://openalex.org/W3101498587","https://openalex.org/W3103182178","https://openalex.org/W3105421296","https://openalex.org/W3153411045","https://openalex.org/W3153675281","https://openalex.org/W3153805297","https://openalex.org/W3166846774","https://openalex.org/W3168867926","https://openalex.org/W3169483174","https://openalex.org/W3173788106","https://openalex.org/W3174770825","https://openalex.org/W3175955584","https://openalex.org/W3176828726","https://openalex.org/W3186081172","https://openalex.org/W3197536862","https://openalex.org/W3199258042","https://openalex.org/W3205717164","https://openalex.org/W3205949070","https://openalex.org/W3212651325","https://openalex.org/W3213715161","https://openalex.org/W4205991051","https://openalex.org/W4221160905","https://openalex.org/W4224308101","https://openalex.org/W4280494215","https://openalex.org/W4286901653","https://openalex.org/W4287694131","https://openalex.org/W4293569541","https://openalex.org/W4301187301","https://openalex.org/W4322588812","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2883671469","https://openalex.org/W3037551068","https://openalex.org/W3023285645","https://openalex.org/W2794347674","https://openalex.org/W3023594376","https://openalex.org/W2972060578","https://openalex.org/W4285877427","https://openalex.org/W783305165","https://openalex.org/W4287802662","https://openalex.org/W4380558612"],"abstract_inverted_index":{"Parameter-efficient":[0],"fine-tuning":[1,30,109,164,178],"methods":[2],"(PEFTs)":[3],"offer":[4],"the":[5,111,123,129,141,180],"promise":[6],"of":[7,18,68,81,117,125,131,136],"adapting":[8],"large":[9],"pre-trained":[10,86,160,182],"models":[11],"while":[12],"only":[13],"tuning":[14],"a":[15,64,78,158,166],"small":[16,94],"number":[17,124],"parameters.":[19,120],"They":[20],"have":[21],"been":[22],"shown":[23],"to":[24,115],"be":[25],"competitive":[26],"with":[27,106,144,157,165],"full":[28,107,163,177],"model":[29,108,119,161],"for":[31,46,60,70,148,170,179],"many":[32],"downstream":[33],"tasks.":[34],"However,":[35],"prior":[36],"work":[37,43,59],"indicates":[38],"that":[39,90,154],"PEFTs":[40,58,69,132,145,156,175],"may":[41],"not":[42],"as":[44,122],"well":[45],"machine":[47],"translation":[48],"(MT),":[49],"and":[50,83,169],"there":[51],"is":[52],"no":[53],"comprehensive":[54,65],"study":[55,67],"showing":[56],"when":[57,110],"MT.":[61],"We":[62,88,152],"conduct":[63],"empirical":[66],"MT,":[71],"considering":[72],"(1)":[73],"various":[74],"parameter":[75,112],"budgets,":[76],"(2)":[77],"diverse":[79],"set":[80],"language-pairs,":[82],"(3)":[84],"different":[85],"models.":[87],"find":[89,153],"\u2018adapters\u2019,":[91],"in":[92],"which":[93],"feed-forward":[95],"networks":[96],"are":[97,102],"added":[98],"after":[99],"every":[100],"layer,":[101],"indeed":[103],"on":[104,140],"par":[105],"budget":[113],"corresponds":[114],"10%":[116],"total":[118],"Nevertheless,":[121],"tuned":[126],"parameters":[127],"decreases,":[128],"performance":[130],"decreases.":[133],"The":[134],"magnitude":[135],"this":[137],"decrease":[138],"depends":[139],"language":[142],"pair,":[143],"particularly":[146],"struggling":[147],"distantly":[149],"related":[150],"language-pairs.":[151],"using":[155],"larger":[159],"outperforms":[162],"smaller":[167,171],"model,":[168],"training":[172],"data":[173],"sizes,":[174],"outperform":[176],"same":[181],"model.":[183]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
