{"id":"https://openalex.org/W4293304020","doi":"https://doi.org/10.48550/arxiv.2205.02022","title":"A Few Thousand Translations Go a Long Way! Leveraging Pre-trained Models for African News Translation","display_name":"A Few Thousand Translations Go a Long Way! Leveraging Pre-trained Models for African News Translation","publication_year":2022,"publication_date":"2022-05-04","ids":{"openalex":"https://openalex.org/W4293304020","doi":"https://doi.org/10.48550/arxiv.2205.02022"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2205.02022","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.02022","pdf_url":"https://arxiv.org/pdf/2205.02022","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2205.02022","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088658365","display_name":"David Ifeoluwa Adelani","orcid":"https://orcid.org/0000-0002-0193-2083"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Adelani, David Ifeoluwa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022193863","display_name":"Jesujoba Oluwadara Alabi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alabi, Jesujoba Oluwadara","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103230346","display_name":"Angela Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Angela","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048307591","display_name":"Julia Kreutzer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kreutzer, Julia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103000631","display_name":"Xiaoyu Shen","orcid":"https://orcid.org/0000-0002-0217-2469"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Xiaoyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073571802","display_name":"Machel Reid","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reid, Machel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037261355","display_name":"Dana Ruiter","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ruiter, Dana","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008875255","display_name":"Dietrich Klakow","orcid":"https://orcid.org/0000-0002-4147-9690"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klakow, Dietrich","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005950162","display_name":"Peter Nabende","orcid":"https://orcid.org/0000-0003-2141-7940"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nabende, Peter","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021305048","display_name":"Ernie Chang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang, Ernie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056428478","display_name":"Tajuddeen Gwadabe","orcid":"https://orcid.org/0000-0002-3901-1589"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gwadabe, Tajuddeen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083467612","display_name":"Freshia Sackey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sackey, Freshia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058219704","display_name":"Bonaventure F. P. Dossou","orcid":"https://orcid.org/0000-0002-0519-1761"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dossou, Bonaventure F. P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043359753","display_name":"Chris Chinenye Emezue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Emezue, Chris Chinenye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028704705","display_name":"Colin Leong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Leong, Colin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091348511","display_name":"Michael Beukman","orcid":"https://orcid.org/0000-0002-5468-284X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beukman, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002849148","display_name":"Shamsuddeen Hassan Muhammad","orcid":"https://orcid.org/0000-0001-7708-0799"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muhammad, Shamsuddeen Hassan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063122505","display_name":"Guyo Jarso","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jarso, Guyo Dub","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043203940","display_name":"Oreen Yousuf","orcid":"https://orcid.org/0009-0000-3320-813X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yousuf, Oreen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024826347","display_name":"Andre Niyongabo Rubungo","orcid":"https://orcid.org/0000-0003-3608-2039"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rubungo, Andre Niyongabo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029414679","display_name":"Gilles Hacheme","orcid":"https://orcid.org/0000-0002-9465-6558"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hacheme, Gilles","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001287329","display_name":"Eric Peter Wairagala","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wairagala, Eric Peter","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027180951","display_name":"Muhammad Umair Nasir","orcid":"https://orcid.org/0000-0002-2458-9599"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nasir, Muhammad Umair","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013671910","display_name":"Benjamin A. Ajibade","orcid":"https://orcid.org/0000-0001-9073-948X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ajibade, Benjamin Ayoade","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086490002","display_name":"Tunde Oluwaseyi Ajayi","orcid":"https://orcid.org/0000-0002-1860-609X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ajayi, Tunde Oluwaseyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090214735","display_name":"Yvonne Gitau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gitau, Yvonne Wambui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087385370","display_name":"Jade Abbott","orcid":"https://orcid.org/0000-0001-6061-0888"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abbott, Jade","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103897560","display_name":"Mohamed Ahmed","orcid":"https://orcid.org/0009-0009-2646-4739"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmed, Mohamed","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089451523","display_name":"Millicent Ochieng","orcid":"https://orcid.org/0000-0003-4769-7039"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ochieng, Millicent","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076526073","display_name":"Anuoluwapo Aremu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aremu, Anuoluwapo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045030523","display_name":"Perez Ogayo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ogayo, Perez","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011303143","display_name":"Jonathan Mukiibi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mukiibi, Jonathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049751102","display_name":"Fatoumata Ouoba Kabore","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kabore, Fatoumata Ouoba","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042051097","display_name":"Godson Koffi Kalipe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kalipe, Godson Koffi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058329063","display_name":"Dergu\u00e8ne Mbaye","orcid":"https://orcid.org/0000-0002-7490-2731"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mbaye, Derguene","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075701052","display_name":"Allahsera Auguste Tapo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tapo, Allahsera Auguste","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001521070","display_name":"Victoire Memdjokam Koagne","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koagne, Victoire Memdjokam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009464697","display_name":"Edwin Munkoh-Buabeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Munkoh-Buabeng, Edwin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057889568","display_name":"Valencia Wagner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wagner, Valencia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054346112","display_name":"Idris Abdulmumin","orcid":"https://orcid.org/0000-0002-3795-8381"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdulmumin, Idris","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089329850","display_name":"Ayodele Awokoya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Awokoya, Ayodele","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029705069","display_name":"Happy Buzaaba","orcid":"https://orcid.org/0000-0001-7985-3396"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Buzaaba, Happy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044121206","display_name":"Blessing Sibanda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sibanda, Blessing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004241641","display_name":"Andiswa Bukula","orcid":"https://orcid.org/0000-0002-6667-4599"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bukula, Andiswa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084616817","display_name":"Sam Manthalu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manthalu, Sam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":45,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9830999970436096,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8241292238235474},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.8119921684265137},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5867383480072021},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5831868648529053},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5315228700637817},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.48635369539260864},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4852873980998993},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.46317344903945923},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4156959354877472},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.41079485416412354}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8241292238235474},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.8119921684265137},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5867383480072021},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5831868648529053},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5315228700637817},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.48635369539260864},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4852873980998993},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.46317344903945923},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4156959354877472},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.41079485416412354},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2205.02022","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.02022","pdf_url":"https://arxiv.org/pdf/2205.02022","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2205.02022","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2205.02022","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2205.02022","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.02022","pdf_url":"https://arxiv.org/pdf/2205.02022","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.44999998807907104,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3011059803","https://openalex.org/W3151736118","https://openalex.org/W2012531322","https://openalex.org/W2898767136","https://openalex.org/W2972060578","https://openalex.org/W4285877427","https://openalex.org/W783305165","https://openalex.org/W4287644835","https://openalex.org/W3092281475","https://openalex.org/W3098003361"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,22,103],"the":[3,38,44,60,104,111,149],"pre-training":[4],"of":[5,54,62,134,141,172],"language":[6],"models":[7,56,77,96,114,168],"leverage":[8,74],"large-scale":[9,45],"datasets":[10],"to":[11,48,59,72,78,117,156,160,164],"create":[12,49,79,125],"multilingual":[13],"models.":[14],"However,":[15],"low-resource":[16,80],"languages":[17,32,63,100,137,158],"are":[18,33,57,138],"mostly":[19],"left":[20],"out":[21],"these":[23,55,122],"datasets.":[24,50],"This":[25,68],"is":[26,163],"primarily":[27],"because":[28],"many":[29],"widely":[30],"spoken":[31],"not":[34,101,139],"well":[35],"represented":[36],"on":[37,89,169],"web":[39],"and":[40,107,159],"therefore":[41],"excluded":[42],"from":[43],"crawls":[46],"used":[47,98],"Furthermore,":[51],"downstream":[52],"users":[53],"restricted":[58],"selection":[61],"originally":[64],"chosen":[65],"for":[66,83,99,153],"pre-training.":[67],"work":[69],"investigates":[70],"how":[71],"optimally":[73],"existing":[75,143],"pre-trained":[76,95,167],"translation":[81,113,174],"systems":[82],"16":[84,132],"African":[85,128],"languages.":[86],"We":[87,146],"focus":[88],"two":[90],"questions:":[91],"1)":[92],"How":[93,109],"can":[94,110],"be":[97],"included":[102],"initial":[105],"pre-training?":[106],"2)":[108],"resulting":[112],"effectively":[115],"transfer":[116],"new":[118,127],"domains?":[119],"To":[120],"answer":[121],"questions,":[123],"we":[124],"a":[126],"news":[129],"corpus":[130],"covering":[131],"languages,":[133],"which":[135],"eight":[136],"part":[140],"any":[142],"evaluation":[144],"dataset.":[145],"demonstrate":[147],"that":[148],"most":[150],"effective":[151],"strategy":[152],"transferring":[154],"both":[155],"additional":[157,161],"domains":[162],"fine-tune":[165],"large":[166],"small":[170],"quantities":[171],"high-quality":[173],"data.":[175]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2022-08-27T00:00:00"}
