{"id":"https://openalex.org/W2798465082","doi":"https://doi.org/10.18653/v1/p18-2104","title":"Adaptive Knowledge Sharing in Multi-Task Learning: Improving Low-Resource Neural Machine Translation","display_name":"Adaptive Knowledge Sharing in Multi-Task Learning: Improving Low-Resource Neural Machine Translation","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2798465082","doi":"https://doi.org/10.18653/v1/p18-2104","mag":"2798465082"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p18-2104","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2104","pdf_url":"https://www.aclweb.org/anthology/P18-2104.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P18-2104.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047560089","display_name":"Poorya Zaremoodi","orcid":null},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Poorya Zaremoodi","raw_affiliation_strings":["Faculty of Information Technology, Monash University, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Monash University, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005792924","display_name":"Wray Buntine","orcid":"https://orcid.org/0000-0001-9292-1015"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Wray Buntine","raw_affiliation_strings":["Faculty of Information Technology, Monash University, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Monash University, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081525024","display_name":"Gholamreza Haffari","orcid":"https://orcid.org/0000-0001-7326-8380"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Gholamreza Haffari","raw_affiliation_strings":["Faculty of Information Technology, Monash University, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Monash University, Australia","institution_ids":["https://openalex.org/I56590836"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5047560089"],"corresponding_institution_ids":["https://openalex.org/I56590836"],"apc_list":null,"apc_paid":null,"fwci":6.7688,"has_fulltext":true,"cited_by_count":57,"citation_normalized_percentile":{"value":0.97373729,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"656","last_page":"661"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9758999943733215,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8435022234916687},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7831239700317383},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7082762122154236},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5945965647697449},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5577603578567505},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4927089512348175},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4691939055919647},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4566144347190857},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4175235629081726},{"id":"https://openalex.org/keywords/vietnamese","display_name":"Vietnamese","score":0.4117524325847626},{"id":"https://openalex.org/keywords/shared-resource","display_name":"Shared resource","score":0.41058871150016785},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08752909302711487}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8435022234916687},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7831239700317383},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7082762122154236},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5945965647697449},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5577603578567505},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4927089512348175},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4691939055919647},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4566144347190857},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4175235629081726},{"id":"https://openalex.org/C103621254","wikidata":"https://www.wikidata.org/wiki/Q9199","display_name":"Vietnamese","level":2,"score":0.4117524325847626},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.41058871150016785},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08752909302711487},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/p18-2104","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2104","pdf_url":"https://www.aclweb.org/anthology/P18-2104.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},{"id":"pmh:oai:monash.edu:publications/52131f3b-7d95-4a63-92ec-0e31bcb0e97a","is_oa":true,"landing_page_url":"https://research.monash.edu/en/publications/52131f3b-7d95-4a63-92ec-0e31bcb0e97a","pdf_url":"https://researchmgt.monash.edu/ws/files/247466786/247466565_oa.pdf","source":{"id":"https://openalex.org/S4306402625","display_name":"Monash University Research Portal (Monash University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I56590836","host_organization_name":"Monash University","host_organization_lineage":["https://openalex.org/I56590836"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Zaremoodi, P, Buntine, W & Haffari, G 2018, Adaptive knowledge sharing in multi-task learning : improving low-resource neural machine translation. in I Gurevych & Y Miyao (eds), ACL 2018 - The 56th Annual Meeting of the Association for Computational Linguistics : Proceedings of the Conference, Vol. 2 (Short Papers). Association for Computational Linguistics (ACL), Stroudsburg PA USA, pp. 656-661, Annual Meeting of the Association of Computational Linguistics 2018, Melbourne, Victoria, Australia, 15/07/18. < http://aclweb.org/anthology/P18-2104 >","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"doi:10.18653/v1/p18-2104","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2104","pdf_url":"https://www.aclweb.org/anthology/P18-2104.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7716553812","display_name":"Learning Deep Semantics for Automatic Translation between Human Languages","funder_award_id":"DP160102686","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"},{"id":"https://openalex.org/G7837352088","display_name":null,"funder_award_id":"Data61","funder_id":"https://openalex.org/F4320320386","funder_display_name":"Commonwealth Scientific and Industrial Research Organisation"}],"funders":[{"id":"https://openalex.org/F4320310145","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95"},{"id":"https://openalex.org/F4320310207","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33"},{"id":"https://openalex.org/F4320320386","display_name":"Commonwealth Scientific and Industrial Research Organisation","ror":"https://ror.org/03qn8fb07"},{"id":"https://openalex.org/F4320334704","display_name":"Australian Research Council","ror":"https://ror.org/05mmh0f86"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2798465082.pdf","grobid_xml":"https://content.openalex.org/works/W2798465082.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W630532510","https://openalex.org/W1522301498","https://openalex.org/W1632114991","https://openalex.org/W1869752048","https://openalex.org/W1902237438","https://openalex.org/W2101105183","https://openalex.org/W2124807415","https://openalex.org/W2133564696","https://openalex.org/W2149327368","https://openalex.org/W2157331557","https://openalex.org/W2550821151","https://openalex.org/W2561274697","https://openalex.org/W2577255746","https://openalex.org/W2595715041","https://openalex.org/W2617039999","https://openalex.org/W2758310181","https://openalex.org/W2773621464","https://openalex.org/W2799920282","https://openalex.org/W2952339051","https://openalex.org/W2962717763","https://openalex.org/W2962784628","https://openalex.org/W2963069010","https://openalex.org/W2963333747","https://openalex.org/W2963393838","https://openalex.org/W2963506925","https://openalex.org/W2964116568","https://openalex.org/W2964121744","https://openalex.org/W2964308564","https://openalex.org/W3204406378","https://openalex.org/W4293718192","https://openalex.org/W4297730607"],"related_works":["https://openalex.org/W2901286616","https://openalex.org/W2291461084","https://openalex.org/W2050882094","https://openalex.org/W3113733647","https://openalex.org/W4206924063","https://openalex.org/W3042674643","https://openalex.org/W1844055093","https://openalex.org/W61780229","https://openalex.org/W2077055222","https://openalex.org/W2973218968"],"abstract_inverted_index":{"Neural":[0],"Machine":[1],"Translation":[2],"(NMT)":[3],"is":[4,23,68],"notorious":[5],"for":[6,9,20],"its":[7],"need":[8],"large":[10],"amounts":[11],"of":[12,35,52,77,106,120],"bilingual":[13],"data.":[14],"An":[15],"effective":[16],"approach":[17,61],"to":[18,27,71,126,136],"compensate":[19],"this":[21,59,81],"requirement":[22],"Multi-Task":[24],"Learning":[25],"(MTL)":[26],"leverage":[28],"different":[29,50],"linguistic":[30],"resources":[31],"as":[32],"a":[33,93],"source":[34],"inductive":[36],"bias.":[37],"Current":[38],"MTL":[39,60],"architectures":[40],"are":[41],"based":[42],"on":[43,109],"the":[44,53,56,85,110],"SEQ2SEQ":[45],"transduction,":[46],"and":[47,67,115,128],"(partially)":[48],"share":[49],"components":[51],"models":[54],"among":[55,75],"tasks.":[57,78],"However,":[58],"often":[62],"suffers":[63],"from":[64],"task":[65,111],"interference,":[66],"not":[69],"able":[70],"fully":[72],"capture":[73],"commonalities":[74],"subsets":[76],"We":[79],"address":[80],"issue":[82],"by":[83,103],"extending":[84],"recurrent":[86],"units":[87],"with":[88,92],"multiple":[89],"blocks":[90,107],"along":[91],"trainable":[94],"routing":[95,98],"network.":[96],"The":[97],"network":[99],"enables":[100],"adaptive":[101],"collaboration":[102],"dynamic":[104],"sharing":[105],"conditioned":[108],"at":[112],"hand,":[113],"input,":[114],"model":[116],"state.":[117],"Empirical":[118],"evaluation":[119],"two":[121],"low-resource":[122],"translation":[123],"tasks,":[124],"English":[125],"Vietnamese":[127],"Farsi,":[129],"show":[130],"+1":[131],"BLEU":[132],"score":[133],"improvements":[134],"compared":[135],"strong":[137],"baselines.":[138]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":13},{"year":2019,"cited_by_count":15},{"year":2018,"cited_by_count":1}],"updated_date":"2026-04-25T08:17:42.794288","created_date":"2025-10-10T00:00:00"}
