{"id":"https://openalex.org/W4283655116","doi":"https://doi.org/10.23919/mipro55190.2022.9803646","title":"NLP-based Typo Correction Model for Croatian Language","display_name":"NLP-based Typo Correction Model for Croatian Language","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W4283655116","doi":"https://doi.org/10.23919/mipro55190.2022.9803646"},"language":"en","primary_location":{"id":"doi:10.23919/mipro55190.2022.9803646","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mipro55190.2022.9803646","pdf_url":null,"source":{"id":"https://openalex.org/S4363605136","display_name":"2022 45th Jubilee International Convention on Information, Communication and Electronic Technology (MIPRO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 45th Jubilee International Convention on Information, Communication and Electronic Technology (MIPRO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073829001","display_name":"Maja Mitreska","orcid":null},"institutions":[{"id":"https://openalex.org/I174143326","display_name":"Macedonian Academy of Sciences and Arts","ror":"https://ror.org/003jsdw96","country_code":"MK","type":"education","lineage":["https://openalex.org/I174143326"]}],"countries":["MK"],"is_corresponding":true,"raw_author_name":"Maja Mitreska","raw_affiliation_strings":["iReason, LLC,Skopje,N. Macedonia","iReason, LLC, Skopje, N. Macedonia"],"affiliations":[{"raw_affiliation_string":"iReason, LLC,Skopje,N. Macedonia","institution_ids":["https://openalex.org/I174143326"]},{"raw_affiliation_string":"iReason, LLC, Skopje, N. Macedonia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084784960","display_name":"Kostadin Mishev","orcid":"https://orcid.org/0000-0003-3982-3330"},"institutions":[{"id":"https://openalex.org/I174143326","display_name":"Macedonian Academy of Sciences and Arts","ror":"https://ror.org/003jsdw96","country_code":"MK","type":"education","lineage":["https://openalex.org/I174143326"]},{"id":"https://openalex.org/I76245029","display_name":"Saints Cyril and Methodius University of Skopje","ror":"https://ror.org/02wk2vx54","country_code":"MK","type":"education","lineage":["https://openalex.org/I76245029"]}],"countries":["MK"],"is_corresponding":false,"raw_author_name":"Kostadin Mishev","raw_affiliation_strings":["iReason, LLC,Skopje,N. Macedonia","iReason, LLC, Skopje, N. Macedonia","Faculty of Computer Science and Engineering, Ss. Cyril and Methodius University, Skopje, N. Macedonia"],"affiliations":[{"raw_affiliation_string":"iReason, LLC,Skopje,N. Macedonia","institution_ids":["https://openalex.org/I174143326"]},{"raw_affiliation_string":"iReason, LLC, Skopje, N. Macedonia","institution_ids":[]},{"raw_affiliation_string":"Faculty of Computer Science and Engineering, Ss. Cyril and Methodius University, Skopje, N. Macedonia","institution_ids":["https://openalex.org/I76245029"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073282867","display_name":"Monika Simjanoska","orcid":"https://orcid.org/0000-0002-5028-3841"},"institutions":[{"id":"https://openalex.org/I174143326","display_name":"Macedonian Academy of Sciences and Arts","ror":"https://ror.org/003jsdw96","country_code":"MK","type":"education","lineage":["https://openalex.org/I174143326"]},{"id":"https://openalex.org/I76245029","display_name":"Saints Cyril and Methodius University of Skopje","ror":"https://ror.org/02wk2vx54","country_code":"MK","type":"education","lineage":["https://openalex.org/I76245029"]}],"countries":["MK"],"is_corresponding":false,"raw_author_name":"Monika Simjanoska","raw_affiliation_strings":["iReason, LLC,Skopje,N. Macedonia","iReason, LLC, Skopje, N. Macedonia","Faculty of Computer Science and Engineering, Ss. Cyril and Methodius University, Skopje, N. Macedonia"],"affiliations":[{"raw_affiliation_string":"iReason, LLC,Skopje,N. Macedonia","institution_ids":["https://openalex.org/I174143326"]},{"raw_affiliation_string":"iReason, LLC, Skopje, N. Macedonia","institution_ids":[]},{"raw_affiliation_string":"Faculty of Computer Science and Engineering, Ss. Cyril and Methodius University, Skopje, N. Macedonia","institution_ids":["https://openalex.org/I76245029"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5073829001"],"corresponding_institution_ids":["https://openalex.org/I174143326"],"apc_list":null,"apc_paid":null,"fwci":0.1041,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.25130636,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"942","last_page":"947"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8592656850814819},{"id":"https://openalex.org/keywords/spelling","display_name":"Spelling","score":0.7403061985969543},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7232972383499146},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.6851575374603271},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6541479229927063},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6163645386695862},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6102166771888733},{"id":"https://openalex.org/keywords/croatian","display_name":"Croatian","score":0.5939136147499084},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.46275660395622253},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.24462002515792847}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8592656850814819},{"id":"https://openalex.org/C2777801307","wikidata":"https://www.wikidata.org/wiki/Q2088390","display_name":"Spelling","level":2,"score":0.7403061985969543},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7232972383499146},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6851575374603271},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6541479229927063},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6163645386695862},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6102166771888733},{"id":"https://openalex.org/C83559648","wikidata":"https://www.wikidata.org/wiki/Q6654","display_name":"Croatian","level":2,"score":0.5939136147499084},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.46275660395622253},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.24462002515792847},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/mipro55190.2022.9803646","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mipro55190.2022.9803646","pdf_url":null,"source":{"id":"https://openalex.org/S4363605136","display_name":"2022 45th Jubilee International Convention on Information, Communication and Electronic Technology (MIPRO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 45th Jubilee International Convention on Information, Communication and Electronic Technology (MIPRO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W2010595692","https://openalex.org/W2023358833","https://openalex.org/W2066792529","https://openalex.org/W2130942839","https://openalex.org/W2155591437","https://openalex.org/W2594422606","https://openalex.org/W2760493402","https://openalex.org/W2767899794","https://openalex.org/W2785047343","https://openalex.org/W2885301267","https://openalex.org/W2896457183","https://openalex.org/W2899508708","https://openalex.org/W2914120296","https://openalex.org/W2916997151","https://openalex.org/W2951559648","https://openalex.org/W2962739339","https://openalex.org/W2964132420","https://openalex.org/W2965373594","https://openalex.org/W2978017171","https://openalex.org/W3035390927","https://openalex.org/W3048123096","https://openalex.org/W3091781323","https://openalex.org/W3093050310","https://openalex.org/W3094220570","https://openalex.org/W3103161287","https://openalex.org/W3126879549","https://openalex.org/W3192770664","https://openalex.org/W3193959417","https://openalex.org/W3212628932","https://openalex.org/W4385245566","https://openalex.org/W6746141323","https://openalex.org/W6756051847","https://openalex.org/W6799788063"],"related_works":["https://openalex.org/W3049463507","https://openalex.org/W2936497627","https://openalex.org/W4288365749","https://openalex.org/W3013624417","https://openalex.org/W4287826556","https://openalex.org/W4287598411","https://openalex.org/W3098382480","https://openalex.org/W3198458223","https://openalex.org/W4288267738","https://openalex.org/W3126642501"],"abstract_inverted_index":{"Spelling":[0],"correction":[1,77,111],"plays":[2],"an":[3,74],"important":[4],"role":[5],"when":[6],"applied":[7],"in":[8,34,113],"complex":[9],"NLP-based":[10],"applications":[11],"and":[12,19,131,167],"pipelines.":[13],"Many":[14],"of":[15,36,49,68,94,101,185],"the":[16,25,31,50,53,66,69,80,92,99,114,140,144,161,168,178,192],"existing":[17],"models":[18],"techniques":[20],"are":[21,164,171],"developed":[22,188],"to":[23,55,57,106,134],"support":[24,138],"English":[26,115],"language":[27,33],"as":[28,148,183],"it":[29],"is":[30,46,119,146,180],"richest":[32],"terms":[35],"resources":[37],"available":[38],"for":[39,72,79,91,139,191],"training":[40,73,145],"such":[41],"models.":[42],"The":[43,83,117],"good":[44],"occasion":[45],"that":[47],"few":[48],"methodologies":[51],"provide":[52],"opportunity":[54],"adapt":[56],"other,":[58],"low-resource":[59],"languages.":[60],"In":[61],"this":[62],"paper,":[63],"we":[64,97],"explore":[65],"power":[67],"Neuspell":[70],"Toolkit":[71],"original":[75],"spelling":[76,110],"model":[78,179,190],"Croatian":[81,141,158,193],"language.":[82,116,142,194],"toolkit":[84],"itself":[85],"comprises":[86],"ten":[87],"different":[88,122],"models,":[89],"but":[90],"purposes":[93],"our":[95,186],"work,":[96],"use":[98],"leverage":[100],"pre-trained":[102,123],"transformer":[103],"networks":[104],"due":[105,133],"their":[107,135,174],"experimentally":[108],"proven":[109],"efficiency":[112],"comparison":[118],"performed":[120],"over":[121],"Subword":[124],"BERT":[125,128],"architectures,":[126],"including":[127],"Multilingual,":[129],"DistilBERT,":[130],"XLM-RoBERTa,":[132],"subword":[136],"representation":[137],"Furthermore,":[143],"done":[147],"a":[149,154],"sequence":[150],"labeling":[151],"task":[152],"on":[153],"newly":[155],"created":[156],"parallel":[157],"dataset":[159],"where":[160],"noisy":[162],"examples":[163],"synthetically":[165],"generated,":[166],"misspelled":[169],"words":[170],"labeled":[172],"with":[173],"correct":[175],"version.":[176],"Finally,":[177],"tested":[181],"in-vivo":[182],"part":[184],"originally":[187],"speech-to-text":[189]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
