{"id":"https://openalex.org/W4415318328","doi":"https://doi.org/10.48550/arxiv.2503.01493","title":"Sherkala-Chat: Building a State-of-the-Art LLM for Kazakh in a Moderately Resourced Setting","display_name":"Sherkala-Chat: Building a State-of-the-Art LLM for Kazakh in a Moderately Resourced Setting","publication_year":2025,"publication_date":"2025-03-03","ids":{"openalex":"https://openalex.org/W4415318328","doi":"https://doi.org/10.48550/arxiv.2503.01493"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2503.01493","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.01493","pdf_url":"https://arxiv.org/pdf/2503.01493","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2503.01493","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065822589","display_name":"Fajri Koto","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Koto, Fajri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108970056","display_name":"Rituraj Joshi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joshi, Rituraj","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116335796","display_name":"Nurdaulet Mukhituly","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mukhituly, Nurdaulet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100631225","display_name":"Yuxia Wang","orcid":"https://orcid.org/0000-0002-6095-1030"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuxia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000261554","display_name":"Zhuohan Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Zhuohan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110171544","display_name":"R. Pal","orcid":"https://orcid.org/0009-0005-0759-3448"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pal, Rahul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000211688","display_name":"Daniil Orel","orcid":"https://orcid.org/0009-0007-5600-7032"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Orel, Daniil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106508350","display_name":"Parvez Mullah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mullah, Parvez","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075508196","display_name":"Diana Turmakhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Turmakhan, Diana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115996950","display_name":"Maiya Goloburda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goloburda, Maiya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067299517","display_name":"Muhammad Kamran","orcid":"https://orcid.org/0000-0002-2943-9098"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kamran, Mohammed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008093186","display_name":"Samujjwal Ghosh","orcid":"https://orcid.org/0000-0003-2859-7358"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ghosh, Samujjwal","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024941988","display_name":"Bokang Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Bokang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092029609","display_name":"Jonibek Mansurov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mansurov, Jonibek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116335795","display_name":"Mukhammed Togmanov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Togmanov, Mukhammed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036210556","display_name":"Debopriyo Banerjee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Banerjee, Debopriyo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067626011","display_name":"Nurkhan Laiyk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Laiyk, Nurkhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106361399","display_name":"Akhmed Sakip","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sakip, Akhmed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058574573","display_name":"Xudong Han","orcid":"https://orcid.org/0000-0001-7961-5179"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Xudong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069779745","display_name":"Ekaterina Kochmar","orcid":"https://orcid.org/0000-0003-3328-1374"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kochmar, Ekaterina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112924039","display_name":"Alham Fikri Aji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aji, Alham Fikri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103156822","display_name":"A. J. Singh","orcid":"https://orcid.org/0009-0001-9185-6407"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Aaryamonvikram","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006526703","display_name":"Aaditya Jadhav","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jadhav, Alok Anil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092728701","display_name":"Satheesh Katipomu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Katipomu, Satheesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004502117","display_name":"Samta Kamboj","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kamboj, Samta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115653578","display_name":"Monojit Choudhury","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choudhury, Monojit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072933457","display_name":"Gurpreet Gosal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gosal, Gurpreet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120050522","display_name":"Gokulakrishnan Ramakrishnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramakrishnan, Gokulakrishnan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029647878","display_name":"Biswajit Mishra","orcid":"https://orcid.org/0000-0001-6288-5383"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mishra, Biswajit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044009163","display_name":"S. C.","orcid":"https://orcid.org/0000-0001-8027-2425"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandran, Sarath","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106508351","display_name":"Avraham Sheinin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheinin, Avraham","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095886528","display_name":"Natalia Vassilieva","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vassilieva, Natalia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060274099","display_name":"Neha Sengupta","orcid":"https://orcid.org/0000-0002-0162-374X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sengupta, Neha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5012055259","display_name":"Preslav Nakov","orcid":"https://orcid.org/0000-0002-3600-1510"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nakov, Preslav","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":34,"corresponding_author_ids":["https://openalex.org/A5065822589"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9182000160217285,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9182000160217285,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kazakh","display_name":"Kazakh","score":0.9516000151634216},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6432999968528748},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.35580000281333923},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.3312000036239624},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.2547999918460846}],"concepts":[{"id":"https://openalex.org/C2781297163","wikidata":"https://www.wikidata.org/wiki/Q9252","display_name":"Kazakh","level":2,"score":0.9516000151634216},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6432999968528748},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5713000297546387},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.35580000281333923},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3481999933719635},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33169999718666077},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.265500009059906},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.2547999918460846},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.23890000581741333}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2503.01493","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.01493","pdf_url":"https://arxiv.org/pdf/2503.01493","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2503.01493","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.01493","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2503.01493","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.01493","pdf_url":"https://arxiv.org/pdf/2503.01493","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Llama-3.1-Sherkala-8B-Chat,":[0],"or":[1],"Sherkala-Chat":[2,19,37,108],"(8B)":[3,20,38,109],"for":[4,17,29,131],"short,":[5],"is":[6,39,96],"a":[7,91,116],"state-of-the-art":[8],"instruction-tuned":[9],"open":[10,66],"generative":[11],"large":[12],"language":[13],"model":[14],"(LLM)":[15],"designed":[16],"Kazakh.":[18],"aims":[21],"to":[22,125],"enhance":[23],"the":[24,34],"inclusivity":[25],"of":[26,71,119],"LLM":[27],"advancements":[28],"Kazakh":[30,67,132],"speakers.":[31,133],"Adapted":[32],"from":[33],"LLaMA-3.1-8B":[35],"model,":[36,113],"trained":[40],"on":[41],"45.3B":[42],"tokens":[43],"across":[44],"Kazakh,":[45,62],"English,":[46],"Russian,":[47],"and":[48,58,68,83,99,102,123,128],"Turkish.":[49],"With":[50],"8":[51],"billion":[52],"parameters,":[53],"it":[54],"demonstrates":[55],"strong":[56],"knowledge":[57],"reasoning":[59],"abilities":[60],"in":[61,78],"significantly":[63],"outper-forming":[64],"existing":[65],"multilingual":[69],"models":[70],"similar":[72],"scale":[73],"while":[74],"achieving":[75],"competitive":[76],"performance":[77],"English.":[79],"To":[80],"ensure":[81],"effective":[82],"responsible":[84],"alignment,":[85,122],"we":[86],"leverage":[87],"translated":[88],"instruction":[89,93],"datasets,":[90],"Kazakhstan-specific":[92],"dataset":[94],"that":[95],"automatically":[97],"constructed":[98],"manually":[100],"verified,":[101],"Kazakh-specific":[103],"safety":[104],"data.":[105],"We":[106],"release":[107],"as":[110],"an":[111],"open-weight":[112],"along":[114],"with":[115],"detailed":[117],"description":[118],"its":[120],"training,":[121],"evaluation,":[124],"support":[126],"research":[127],"real-world":[129],"applications":[130]},"counts_by_year":[],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-18T00:00:00"}
