{"id":"https://openalex.org/W7125963893","doi":"https://doi.org/10.3390/computers15020073","title":"An Integrated Approach to Adapting Open-Source AI Models for Machine Translation of Low-Resource Turkic Languages","display_name":"An Integrated Approach to Adapting Open-Source AI Models for Machine Translation of Low-Resource Turkic Languages","publication_year":2026,"publication_date":"2026-01-28","ids":{"openalex":"https://openalex.org/W7125963893","doi":"https://doi.org/10.3390/computers15020073"},"language":"en","primary_location":{"id":"doi:10.3390/computers15020073","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers15020073","pdf_url":"https://www.mdpi.com/2073-431X/15/2/73/pdf?version=1769676576","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2073-431X/15/2/73/pdf?version=1769676576","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000744340","display_name":"Ualsher Tukeyev","orcid":"https://orcid.org/0000-0001-9878-981X"},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Ualsher Tukeyev","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055611204","display_name":"Assem Shormakova","orcid":"https://orcid.org/0000-0002-1637-4643"},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":true,"raw_author_name":"Assem Shormakova","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":"https://orcid.org/0000-0002-1637-4643","affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124098631","display_name":"Aidana Karibayeva","orcid":null},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Aidana Karibayeva","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046987190","display_name":"Diana Rakhimova","orcid":"https://orcid.org/0000-0003-1427-198X"},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Diana Rakhimova","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079604919","display_name":"Balzhan Abduali","orcid":"https://orcid.org/0000-0003-0140-4181"},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Balzhan Abduali","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124058365","display_name":"Dina Amirova","orcid":null},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Dina Amirova","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124123705","display_name":"Nazym Rakhmanberdi","orcid":null},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Nazym Rakhmanberdi","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":"https://orcid.org/0009-0002-7188-4838","affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124069691","display_name":"Rashid Aliyev","orcid":null},"institutions":[{"id":"https://openalex.org/I185571130","display_name":"Al-Farabi Kazakh National University","ror":"https://ror.org/03q0vrn42","country_code":"KZ","type":"education","lineage":["https://openalex.org/I185571130"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Rashid Aliyev","raw_affiliation_strings":["Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology and Artificial Intelligence, Farabi University, Almaty 050040, Kazakhstan","institution_ids":["https://openalex.org/I185571130"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5055611204"],"corresponding_institution_ids":["https://openalex.org/I185571130"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16248047,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"15","issue":"2","first_page":"73","last_page":"73"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9128000140190125,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9128000140190125,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.006099999882280827,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13650","display_name":"Computational Physics and Python Applications","score":0.003800000064074993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.8389999866485596},{"id":"https://openalex.org/keywords/parallel-corpora","display_name":"Parallel corpora","score":0.6628000140190125},{"id":"https://openalex.org/keywords/bleu","display_name":"BLEU","score":0.6431999802589417},{"id":"https://openalex.org/keywords/computational-linguistics","display_name":"Computational linguistics","score":0.40689998865127563},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.3833000063896179},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.35040000081062317}],"concepts":[{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.8389999866485596},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.78329998254776},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6912999749183655},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6797000169754028},{"id":"https://openalex.org/C2985367798","wikidata":"https://www.wikidata.org/wiki/Q1346592","display_name":"Parallel corpora","level":3,"score":0.6628000140190125},{"id":"https://openalex.org/C622187","wikidata":"https://www.wikidata.org/wiki/Q3500773","display_name":"BLEU","level":3,"score":0.6431999802589417},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.40689998865127563},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.3833000063896179},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.35040000081062317},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.3230000138282776},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C2986258472","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation system","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25360000133514404}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/computers15020073","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers15020073","pdf_url":"https://www.mdpi.com/2073-431X/15/2/73/pdf?version=1769676576","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:a0cda0457e1f40a3aef10be8343b91da","is_oa":false,"landing_page_url":"https://doaj.org/article/a0cda0457e1f40a3aef10be8343b91da","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers, Vol 15, Iss 2, p 73 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/computers15020073","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers15020073","pdf_url":"https://www.mdpi.com/2073-431X/15/2/73/pdf?version=1769676576","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7125963893.pdf","grobid_xml":"https://content.openalex.org/works/W7125963893.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,29,99],"study":[1],"presents":[2],"the":[3,82,191,197,201,230,242,262,276,295,300,317],"application":[4],"of":[5,38,84,128,183,193,233,244,272,278,290,308],"free,":[6],"open-source":[7,86],"artificial":[8],"intelligence":[9],"(AI)":[10],"techniques":[11],"to":[12,41,49,69,77,240],"advance":[13],"machine":[14,30,61,245,291],"translation":[15,31,62,246,292],"for":[16,33,57,73,93,105,123,139,203,247,281],"low-resource":[17,248],"Turkic":[18,34,97,107,249],"languages":[19,35,75,250],"such":[20],"as":[21],"Kazakh,":[22],"Azerbaijani,":[23],"Kyrgyz,":[24],"Turkish,":[25],"Turkmen,":[26],"and":[27,53,76,89,110,117,130,135,164,166,171,176,190,217,219,224,236,266,293,313,322],"Uzbek.":[28],"problem":[32],"is":[36,68,275],"part":[37],"a":[39,279,286],"project":[40],"generate":[42],"meeting":[43],"minutes":[44],"from":[45],"speech":[46],"transcripts.":[47],"Due":[48],"limited":[50],"parallel":[51,103,121,142,181,283,306],"corpora":[52,104,122,140,182,284,307],"underdeveloped":[54],"linguistic":[55],"tools":[56],"these":[58,74],"languages,":[59,108,126],"traditional":[60],"approaches":[63],"often":[64],"underperform.":[65],"The":[66,120,137,269],"goal":[67],"reduce":[70],"digital":[71],"inequality":[72],"support":[78],"scalability.":[79],"We":[80],"investigate":[81],"effectiveness":[83],"free":[85],"pre-trained":[87],"specialized":[88,287,296],"general-purpose":[90],"AI":[91,252,288,297],"models":[92],"morphologically":[94],"rich":[95],"state":[96],"languages.":[98],"research":[100],"includes":[101],"developing":[102],"six":[106],"fine-tuning,":[109],"performance":[111],"evaluation":[112,260],"using":[113,251,285,316],"BLEU,":[114],"WER,":[115],"TER,":[116],"chrF":[118,159,212],"metrics.":[119],"five":[124],"pair":[125],"each":[127],"300,000":[129],"500,000":[131,141,204],"sentences,":[132],"were":[133,188,256],"generated":[134],"cleaned.":[136],"results":[138,202,228,255],"sentences":[143,187],"show":[144],"significant":[145],"improvements":[146],"compared":[147,199],"with":[148,200],"baseline":[149],"NLLB-200":[150,194],"1.3B":[151,195],"on":[152,261,299],"average:":[153],"BLEU":[154,207],"increased":[155,160,208,213],"by":[156,161,169,209,214,222,258],"23.81":[157],"points,":[158,163,211,216],"26.05":[162],"WER":[165,218],"TER":[167,220],"decreased":[168,221],"0.36":[170],"33.95,":[172],"respectively,":[173],"after":[174],"cleaning":[175,235,320],"fine-tuning.":[177],"Six":[178],"Turkic-language":[179],"multilingual":[180,305],"3":[184],"885":[185],"542":[186],"developed":[189],"fine-tuning":[192,294,324],"shows":[196],"following,":[198],"cleaned":[205],"corpus:":[206],"4.3":[210],"1.7":[215],"0.1":[223],"4.75,":[225],"respectively":[226],"These":[227,254],"demonstrate":[229],"high":[231],"efficiency":[232],"corpus":[234],"synthetic":[237],"data":[238],"generation":[239],"improve":[241],"quality":[243],"models.":[253],"confirmed":[257],"external":[259],"FLORES":[263],"200":[264],"dataset":[265],"human":[267],"evaluation.":[268],"scientific":[270],"contribution":[271],"this":[273],"article":[274],"development":[277],"methodology":[280],"generating":[282],"model":[289,298],"created":[301],"corpora,":[302],"creating":[303],"new":[304],"Azerbaijan\u2013Kazakh,":[309],"Kyrgyz\u2013Kazakh,":[310],"Turkish\u2013Kazakh,":[311],"Turkmen\u2013Kazakh,":[312],"Uzbek\u2013Kazakh":[314],"pairs":[315],"proposed":[318],"methodology,":[319],"them,":[321],"conducting":[323],"experiments.":[325]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2026-01-29T00:00:00"}
