{"id":"https://openalex.org/W2886342729","doi":"https://doi.org/10.18653/v1/w18-2705","title":"Regularized Training Objective for Continued Training for Domain Adaptation in Neural Machine Translation","display_name":"Regularized Training Objective for Continued Training for Domain Adaptation in Neural Machine Translation","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2886342729","doi":"https://doi.org/10.18653/v1/w18-2705","mag":"2886342729"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w18-2705","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w18-2705","pdf_url":"https://www.aclweb.org/anthology/W18-2705.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd Workshop on Neural Machine Translation and Generation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W18-2705.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080544452","display_name":"Huda Khayrallah","orcid":"https://orcid.org/0000-0002-2920-6745"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Huda Khayrallah","raw_affiliation_strings":["Department of Computer Science Johns Hopkins University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science Johns Hopkins University","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105836462","display_name":"Brian J. Thompson","orcid":null},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian Thompson","raw_affiliation_strings":["Department of Computer Science Johns Hopkins University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science Johns Hopkins University","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070418792","display_name":"Kevin Duh","orcid":"https://orcid.org/0000-0001-8107-4383"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kevin Duh","raw_affiliation_strings":["Department of Computer Science Johns Hopkins University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science Johns Hopkins University","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112315093","display_name":"Philipp Koehn","orcid":null},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Philipp Koehn","raw_affiliation_strings":["Department of Computer Science Johns Hopkins University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science Johns Hopkins University","institution_ids":["https://openalex.org/I145311948"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5080544452"],"corresponding_institution_ids":["https://openalex.org/I145311948"],"apc_list":null,"apc_paid":null,"fwci":10.1543,"has_fulltext":true,"cited_by_count":78,"citation_normalized_percentile":{"value":0.98433205,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7839221954345703},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7569708824157715},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.7541093230247498},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6770931482315063},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.6389415264129639},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5669766664505005},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5340797901153564},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5201583504676819},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4434697926044464},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4217611253261566},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4141498804092407},{"id":"https://openalex.org/keywords/cross-entropy","display_name":"Cross entropy","score":0.4105619490146637},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3781708776950836},{"id":"https://openalex.org/keywords/principle-of-maximum-entropy","display_name":"Principle of maximum entropy","score":0.3527919054031372},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11142149567604065}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7839221954345703},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7569708824157715},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.7541093230247498},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6770931482315063},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.6389415264129639},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5669766664505005},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5340797901153564},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5201583504676819},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4434697926044464},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4217611253261566},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4141498804092407},{"id":"https://openalex.org/C167981619","wikidata":"https://www.wikidata.org/wiki/Q1685498","display_name":"Cross entropy","level":3,"score":0.4105619490146637},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3781708776950836},{"id":"https://openalex.org/C9679016","wikidata":"https://www.wikidata.org/wiki/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.3527919054031372},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11142149567604065},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.18653/v1/w18-2705","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w18-2705","pdf_url":"https://www.aclweb.org/anthology/W18-2705.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd Workshop on Neural Machine Translation and Generation","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:publications/9358b6e3-a52c-4738-919e-3e1db80e8a04","is_oa":true,"landing_page_url":null,"pdf_url":"https://www.research.ed.ac.uk/en/publications/9358b6e3-a52c-4738-919e-3e1db80e8a04","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:pure.ed.ac.uk:publications/9358b6e3-a52c-4738-919e-3e1db80e8a04","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/9358b6e3-a52c-4738-919e-3e1db80e8a04","pdf_url":"https://www.research.ed.ac.uk/en/publications/9358b6e3-a52c-4738-919e-3e1db80e8a04","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Khayrallah, H, Thompson, B, Duh, K & Koehn, P 2018, Regularized Training Objective for Continued Training for Domain Adaptation in Neural Machine Translation. in Proceedings of the 2nd Workshop on Neural Machine Translation and Generation . Melbourne, Australia , pp. 36-44, 2nd Workshop on Neural Machine Translation and Generation, Melbourne, Victoria, Australia, 15/07/18. < http://aclweb.org/anthology/W18-2705 >","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"doi:10.18653/v1/w18-2705","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w18-2705","pdf_url":"https://www.aclweb.org/anthology/W18-2705.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd Workshop on Neural Machine Translation and Generation","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3429874898","display_name":null,"funder_award_id":"LORELEI","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G4823715754","display_name":null,"funder_award_id":"NDSEG","funder_id":"https://openalex.org/F4320306078","funder_display_name":"U.S. Department of Defense"},{"id":"https://openalex.org/G7320824963","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306078","funder_display_name":"U.S. Department of Defense"},{"id":"https://openalex.org/G8926491534","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320333566","funder_display_name":"National Defense Science and Engineering Graduate"}],"funders":[{"id":"https://openalex.org/F4320306078","display_name":"U.S. Department of Defense","ror":"https://ror.org/0447fe631"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320333566","display_name":"National Defense Science and Engineering Graduate","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2886342729.pdf","grobid_xml":"https://content.openalex.org/works/W2886342729.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W22168010","https://openalex.org/W630532510","https://openalex.org/W635530177","https://openalex.org/W1989549063","https://openalex.org/W2100495367","https://openalex.org/W2113839990","https://openalex.org/W2133564696","https://openalex.org/W2183341477","https://openalex.org/W2184135559","https://openalex.org/W2525778437","https://openalex.org/W2527845440","https://openalex.org/W2537667581","https://openalex.org/W2560647685","https://openalex.org/W2567571499","https://openalex.org/W2581377246","https://openalex.org/W2744813330","https://openalex.org/W2757291580","https://openalex.org/W2760656271","https://openalex.org/W2782917850","https://openalex.org/W2903193068","https://openalex.org/W2962784628","https://openalex.org/W2962863357","https://openalex.org/W2962867687","https://openalex.org/W2963212250","https://openalex.org/W2963403868","https://openalex.org/W2963506925","https://openalex.org/W2963736842","https://openalex.org/W2964067969","https://openalex.org/W2964308564","https://openalex.org/W3204406378","https://openalex.org/W4297798436","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W3011059803","https://openalex.org/W3151736118","https://openalex.org/W2756978580","https://openalex.org/W2577063019","https://openalex.org/W2154124206","https://openalex.org/W2972060578","https://openalex.org/W4285877427","https://openalex.org/W783305165","https://openalex.org/W2531741693","https://openalex.org/W4385386361"],"abstract_inverted_index":{"Supervised":[0],"domain":[1,114],"adaptation-where":[2],"a":[3,8,17,29,37,112],"large":[4],"generic":[5,30],"corpus":[6,11],"and":[7,32,78,106],"smaller":[9],"indomain":[10,73],"are":[12],"both":[13],"available":[14],"for":[15,19],"training-is":[16],"challenge":[18],"neural":[20],"machine":[21],"translation":[22],"(NMT).":[23],"Standard":[24],"practice":[25],"is":[26],"to":[27,35,49,59,84,127],"train":[28],"model":[31,45,83],"use":[33],"it":[34],"initialize":[36],"second":[38,44],"model,":[39],"then":[40],"continue":[41],"training":[42,61,65,124],"the":[43,60,68,72,81,86,94],"on":[46,101],"in-domain":[47,52],"data":[48],"produce":[50],"an":[51,56],"model.":[53,97,116],"We":[54,98],"add":[55],"auxiliary":[57],"term":[58],"objective":[62],"during":[63],"continued":[64,123],"that":[66,79],"minimizes":[67],"cross":[69],"entropy":[70],"between":[71],"model's":[74,87],"output":[75,88],"word":[76],"distribution":[77],"of":[80,104],"out-of-domain":[82],"prevent":[85],"from":[89,93,111],"differing":[90],"too":[91],"much":[92],"original":[95],"out-ofdomain":[96],"perform":[99],"experiments":[100],"EMEA":[102],"(descriptions":[103],"medicines)":[105],"TED":[107],"(rehearsed":[108],"presentations),":[109],"initialized":[110],"general":[113],"(WMT)":[115],"Our":[117],"method":[118],"shows":[119],"improvements":[120],"over":[121],"standard":[122],"by":[125],"up":[126],"1.5":[128],"BLEU.":[129]},"counts_by_year":[{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":32},{"year":2019,"cited_by_count":14},{"year":2018,"cited_by_count":4}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
