{"id":"https://openalex.org/W7133313321","doi":"https://doi.org/10.48550/arxiv.2603.01691","title":"Building a Strong Instruction Language Model for a Less-Resourced Language","display_name":"Building a Strong Instruction Language Model for a Less-Resourced Language","publication_year":2026,"publication_date":"2026-03-02","ids":{"openalex":"https://openalex.org/W7133313321","doi":"https://doi.org/10.48550/arxiv.2603.01691"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01691","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01691","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01691","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013906492","display_name":"Domen Vre\u0161","orcid":"https://orcid.org/0000-0002-9225-2699"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Vre\u0161, Domen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127926483","display_name":"Tja\u0161a Ar\u010don","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ar\u010don, Tja\u0161a","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116063423","display_name":"Timotej Petri\u010d","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Petri\u010d, Timotej","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120318249","display_name":"Dario Vajda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vajda, Dario","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127918983","display_name":"Marko Robnik-\u0160ikonja","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robnik-\u0160ikonja, Marko","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5010861913","display_name":"Iztok Lebar Bajec","orcid":"https://orcid.org/0000-0003-4722-6712"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bajec, Iztok Lebar","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5013906492"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2045000046491623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2045000046491623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.19779999554157257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.11180000007152557,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.6858000159263611},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5231999754905701},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4925000071525574},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.42980000376701355},{"id":"https://openalex.org/keywords/constructed-language","display_name":"Constructed language","score":0.42820000648498535},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4007999897003174}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7605999708175659},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6858000159263611},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5670999884605408},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.551800012588501},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5231999754905701},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4925000071525574},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4332999885082245},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.42980000376701355},{"id":"https://openalex.org/C94922259","wikidata":"https://www.wikidata.org/wiki/Q33215","display_name":"Constructed language","level":2,"score":0.42820000648498535},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4007999897003174},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.39329999685287476},{"id":"https://openalex.org/C74672266","wikidata":"https://www.wikidata.org/wiki/Q815859","display_name":"Language acquisition","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.2856999933719635},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.26930001378059387}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01691","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01691","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01691","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01691","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.43503105640411377}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1,11,96],"models":[2,20],"(LLMs)":[3],"have":[4],"become":[5],"an":[6,49],"essential":[7],"tool":[8],"for":[9,44,68,83],"natural":[10],"processing":[12],"and":[13,34,55,74,125,129,134,147,166],"artificial":[14],"intelligence":[15],"in":[16,28,174],"general.":[17],"Current":[18],"open-source":[19,81],"are":[21],"primarily":[22],"trained":[23,113],"on":[24,31,116,141],"English":[25,133],"texts,":[26],"resulting":[27],"poorer":[29],"performance":[30],"less-resourced":[32,53],"languages":[33],"cultures.":[35],"We":[36,62,89,112,138,152],"present":[37,63],"a":[38,52,65,117,180],"set":[39],"of":[40,48,101,119,183],"methodological":[41],"approaches":[42],"necessary":[43],"the":[45,59,79,91,94,102,114,142,148,155,175],"successful":[46],"adaptation":[47],"LLM":[50,150,177],"to":[51,93,169],"language,":[54],"demonstrate":[56,75],"them":[57],"using":[58,97],"Slovene":[60,69,84,95,135,149,176],"language.":[61],"GaMS3-12B,":[64],"generative":[66],"model":[67,82,92,115,157],"with":[70],"12":[71],"billion":[72],"parameters,":[73],"that":[76,154],"it":[77],"is":[78],"best-performing":[80],"within":[85],"its":[86],"parameter":[87],"range.":[88],"adapted":[90],"three-stage":[98],"continual":[99],"pre-training":[100],"Gemma":[103,160],"3":[104,161],"model,":[105],"followed":[106],"by":[107],"two-stage":[108],"supervised":[109],"fine-tuning":[110],"(SFT).":[111],"combination":[118],"140B":[120],"Slovene,":[121],"English,":[122],"Bosnian,":[123],"Serbian,":[124],"Croatian":[126],"pretraining":[127],"tokens,":[128],"over":[130,184],"200":[131],"thousand":[132],"SFT":[136],"examples.":[137],"evaluate":[139],"GaMS3-12B":[140],"Slovenian-LLM-Eval":[143],"datasets,":[144],"English-to-Slovene":[145],"translation,":[146],"arena.":[151],"show":[153],"described":[156],"outperforms":[158],"12B":[159],"across":[162],"all":[163],"three":[164],"scenarios":[165],"performs":[167],"comparably":[168],"much":[170],"larger":[171],"commercial":[172],"GPT-4o":[173],"arena,":[178],"achieving":[179],"win":[181],"rate":[182],"60":[185],"%.":[186]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
