{"id":"https://openalex.org/W4285077564","doi":"https://doi.org/10.48550/arxiv.2207.04672","title":"No Language Left Behind: Scaling Human-Centered Machine Translation","display_name":"No Language Left Behind: Scaling Human-Centered Machine Translation","publication_year":2022,"publication_date":"2022-07-11","ids":{"openalex":"https://openalex.org/W4285077564","doi":"https://doi.org/10.48550/arxiv.2207.04672"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2207.04672","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.04672","pdf_url":"https://arxiv.org/pdf/2207.04672","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2207.04672","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011813864","display_name":"Nllb Team","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"NLLB Team","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074210163","display_name":"Marta R. Costa\u2010juss\u00e0","orcid":"https://orcid.org/0000-0002-5703-520X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Costa-juss\u00e0, Marta R.","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101916721","display_name":"James H. Cross","orcid":"https://orcid.org/0009-0007-1347-1740"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cross, James","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055056487","display_name":"Onur \u00c7elebi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"\u00c7elebi, Onur","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005764737","display_name":"Maha Elbayad","orcid":"https://orcid.org/0000-0002-8389-231X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elbayad, Maha","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070589644","display_name":"Kenneth Heafield","orcid":"https://orcid.org/0000-0002-6344-9927"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heafield, Kenneth","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059012246","display_name":"Kevin S. Heffernan","orcid":"https://orcid.org/0000-0002-3499-1477"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heffernan, Kevin","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023818527","display_name":"Elahe Kalbassi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kalbassi, Elahe","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054317026","display_name":"Janice Lam","orcid":"https://orcid.org/0000-0001-5167-3799"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lam, Janice","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056885320","display_name":"Daniel J. Licht","orcid":"https://orcid.org/0000-0002-4080-843X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Licht, Daniel","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104441926","display_name":"Jean Maillard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maillard, Jean","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029985197","display_name":"Anna Sun","orcid":"https://orcid.org/0009-0007-6467-0563"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Anna","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051093305","display_name":"Skyler Wang","orcid":"https://orcid.org/0000-0002-0639-945X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Skyler","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023203387","display_name":"Guillaume Wenzek","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wenzek, Guillaume","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047396415","display_name":"Al Youngblood","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Youngblood, Al","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037594716","display_name":"Bapi Akula","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akula, Bapi","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043289060","display_name":"Lo\u00efc Barrault","orcid":"https://orcid.org/0000-0002-0634-6147"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barrault, Loic","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035598726","display_name":"Gabriel Mejia Gonzalez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gonzalez, Gabriel Mejia","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029804928","display_name":"Prangthip Hansanti","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hansanti, Prangthip","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109346484","display_name":"John P. Hoffman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hoffman, John","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032320234","display_name":"Semarley Jarrett","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jarrett, Semarley","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023501975","display_name":"Kaushik Ram Sadagopan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sadagopan, Kaushik Ram","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027709388","display_name":"Dirk Rowe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rowe, Dirk","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047118262","display_name":"Shannon Spruit","orcid":"https://orcid.org/0000-0001-9252-5741"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spruit, Shannon","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102020669","display_name":"Chau Tran","orcid":"https://orcid.org/0009-0001-1338-3982"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tran, Chau","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091619219","display_name":"Pierre Andrews","orcid":"https://orcid.org/0000-0001-6780-7798"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andrews, Pierre","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062598662","display_name":"Necip Faz\u0131l Ayan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ayan, Necip Fazil","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065321401","display_name":"Shruti Bhosale","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhosale, Shruti","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016113002","display_name":"Sergey Edunov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Edunov, Sergey","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103230346","display_name":"Angela Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Angela","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024347376","display_name":"Cynthia Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Cynthia","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035752789","display_name":"Vedanuj Goswami","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goswami, Vedanuj","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113551755","display_name":"Francisco Guzm\u00e1n","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guzm\u00e1n, Francisco","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112315093","display_name":"Philipp Koehn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koehn, Philipp","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010669494","display_name":"Alexandre Mourachko","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mourachko, Alexandre","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030185276","display_name":"Christophe Ropers","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ropers, Christophe","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033648476","display_name":"Safiyyah Saleem","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saleem, Safiyyah","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015857371","display_name":"Holger Schwenk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwenk, Holger","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061222029","display_name":"Jeff Wang","orcid":"https://orcid.org/0000-0001-9923-1068"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jeff","raw_affiliation_strings":["NLLB Team"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NLLB Team","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":39,"corresponding_author_ids":["https://openalex.org/A5011813864"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":362,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9674999713897705,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.907800018787384,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7847155332565308},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7779359221458435},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.5975189208984375},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5814959406852722},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5481919050216675},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5370188355445862},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.5245347619056702},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4428386092185974},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4370438754558563},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.39588478207588196},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36109277606010437},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.12548139691352844}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7847155332565308},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7779359221458435},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.5975189208984375},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5814959406852722},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5481919050216675},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5370188355445862},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.5245347619056702},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4428386092185974},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4370438754558563},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39588478207588196},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36109277606010437},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.12548139691352844},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2207.04672","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.04672","pdf_url":"https://arxiv.org/pdf/2207.04672","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2207.04672","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2207.04672","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2207.04672","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2207.04672","pdf_url":"https://arxiv.org/pdf/2207.04672","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W1574414179","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W4297676672","https://openalex.org/W4281702477","https://openalex.org/W2490526372","https://openalex.org/W4376166922","https://openalex.org/W4378510483","https://openalex.org/W4221142204"],"abstract_inverted_index":{"Driven":[0],"by":[1,79],"the":[2,39,52,82,104,163,204],"goal":[3],"of":[4,21,35,42,125,158,165,199],"eradicating":[5],"language":[6,54,86],"barriers":[7],"on":[8,76,121,130,156],"a":[9,18,32,116,172,181,212],"global":[10],"scale,":[11],"machine":[12],"translation":[13,87,169,192,214],"has":[14],"solidified":[15],"itself":[16],"as":[17],"key":[19],"focus":[20],"artificial":[22],"intelligence":[23],"research":[24],"today.":[25],"However,":[26],"such":[27],"efforts":[28],"have":[29],"coalesced":[30],"around":[31],"small":[33],"subset":[34],"languages,":[36],"leaving":[37],"behind":[38],"vast":[40],"majority":[41],"mostly":[43],"low-resource":[44,85,142],"languages.":[45,111,143],"What":[46],"does":[47],"it":[48],"take":[49],"to":[50,151,190,203],"break":[51],"200":[53],"barrier":[55],"while":[56,63,154],"ensuring":[57],"safe,":[58],"high":[59],"quality":[60],"results,":[61],"all":[62,186,220],"keeping":[64],"ethical":[65],"considerations":[66],"in":[67,188,223],"mind?":[68],"In":[69],"No":[70],"Language":[71],"Left":[72],"Behind,":[73],"we":[74,96,114,161,217],"took":[75],"this":[77,224],"challenge":[78],"first":[80],"contextualizing":[81],"need":[83],"for":[84,141],"support":[88],"through":[89],"exploratory":[90],"interviews":[91],"with":[92,133,180],"native":[93],"speakers.":[94],"Then,":[95],"created":[97],"datasets":[98],"and":[99,109,135,148,176],"models":[100],"aimed":[101],"at":[102,227],"narrowing":[103],"performance":[105,164],"gap":[106],"between":[107],"low":[108],"high-resource":[110],"More":[112],"specifically,":[113],"developed":[115],"conditional":[117],"compute":[118],"model":[119,195],"based":[120],"Sparsely":[122],"Gated":[123],"Mixture":[124],"Experts":[126],"that":[127],"is":[128],"trained":[129],"data":[131,137],"obtained":[132],"novel":[134,182],"effective":[136],"mining":[138],"techniques":[139],"tailored":[140],"We":[144],"propose":[145],"multiple":[146],"architectural":[147],"training":[149,155],"improvements":[150],"counteract":[152],"overfitting":[153],"thousands":[157],"tasks.":[159],"Critically,":[160],"evaluated":[162],"over":[166],"40,000":[167],"different":[168],"directions":[170],"using":[171],"human-translated":[173],"benchmark,":[174],"Flores-200,":[175],"combined":[177],"human":[178],"evaluation":[179],"toxicity":[183],"benchmark":[184],"covering":[185],"languages":[187],"Flores-200":[189],"assess":[191],"safety.":[193],"Our":[194],"achieves":[196],"an":[197],"improvement":[198],"44%":[200],"BLEU":[201],"relative":[202],"previous":[205],"state-of-the-art,":[206],"laying":[207],"important":[208],"groundwork":[209],"towards":[210],"realizing":[211],"universal":[213],"system.":[215],"Finally,":[216],"open":[218],"source":[219],"contributions":[221],"described":[222],"work,":[225],"accessible":[226],"https://github.com/facebookresearch/fairseq/tree/nllb.":[228]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":48},{"year":2024,"cited_by_count":81},{"year":2023,"cited_by_count":210},{"year":2022,"cited_by_count":15},{"year":2020,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
