{"id":"https://openalex.org/W4376273932","doi":"https://doi.org/10.3390/data8050089","title":"A Comprehensive Dataset of Spelling Errors and Users\u2019 Corrections in Croatian Language","display_name":"A Comprehensive Dataset of Spelling Errors and Users\u2019 Corrections in Croatian Language","publication_year":2023,"publication_date":"2023-05-12","ids":{"openalex":"https://openalex.org/W4376273932","doi":"https://doi.org/10.3390/data8050089"},"language":"en","primary_location":{"id":"doi:10.3390/data8050089","is_oa":true,"landing_page_url":"https://doi.org/10.3390/data8050089","pdf_url":"https://www.mdpi.com/2306-5729/8/5/89/pdf?version=1684135949","source":{"id":"https://openalex.org/S4210226510","display_name":"Data","issn_l":"2306-5729","issn":["2306-5729"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2306-5729/8/5/89/pdf?version=1684135949","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037067710","display_name":"Gordan Gledec","orcid":"https://orcid.org/0000-0003-4188-6357"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":true,"raw_author_name":"Gordan Gledec","raw_affiliation_strings":["Department of Applied Computing, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia"],"raw_orcid":"https://orcid.org/0000-0003-4188-6357","affiliations":[{"raw_affiliation_string":"Department of Applied Computing, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058605862","display_name":"Marko Horvat","orcid":"https://orcid.org/0000-0002-3439-7216"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Marko Horvat","raw_affiliation_strings":["Department of Applied Computing, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia"],"raw_orcid":"https://orcid.org/0000-0002-3439-7216","affiliations":[{"raw_affiliation_string":"Department of Applied Computing, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051477039","display_name":"Miljenko Mikuc","orcid":"https://orcid.org/0000-0002-6408-4405"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Miljenko Mikuc","raw_affiliation_strings":["Department of Telecommunications, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Telecommunications, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079091830","display_name":"B. Blaskovic","orcid":"https://orcid.org/0000-0001-9612-4769"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Bruno Bla\u0161kovi\u0107","raw_affiliation_strings":["Department of Electrical Engineering Fundamentals and Measurements, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia"],"raw_orcid":"https://orcid.org/0000-0001-9612-4769","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering Fundamentals and Measurements, Faculty of Electrical Engineering and Computing, University of Zagreb, Unska 3, HR-10000 Zagreb, Croatia","institution_ids":["https://openalex.org/I181343428"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5037067710"],"corresponding_institution_ids":["https://openalex.org/I181343428"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":0.8065,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.77275964,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":"8","issue":"5","first_page":"89","last_page":"89"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9796000123023987,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8288059830665588},{"id":"https://openalex.org/keywords/spelling","display_name":"Spelling","score":0.828033447265625},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6420069336891174},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6123483777046204},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4901367127895355},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4304009974002838},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.41123533248901367},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.18197423219680786}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8288059830665588},{"id":"https://openalex.org/C2777801307","wikidata":"https://www.wikidata.org/wiki/Q2088390","display_name":"Spelling","level":2,"score":0.828033447265625},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6420069336891174},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6123483777046204},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4901367127895355},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4304009974002838},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.41123533248901367},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.18197423219680786},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/data8050089","is_oa":true,"landing_page_url":"https://doi.org/10.3390/data8050089","pdf_url":"https://www.mdpi.com/2306-5729/8/5/89/pdf?version=1684135949","source":{"id":"https://openalex.org/S4210226510","display_name":"Data","issn_l":"2306-5729","issn":["2306-5729"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:gam:jdataj:v:8:y:2023:i:5:p:89-:d:1145798","is_oa":false,"landing_page_url":"https://www.mdpi.com/2306-5729/8/5/89/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},{"id":"pmh:oai:doaj.org/article:42b73256bf5343e5be2d1ff0709dcbaf","is_oa":true,"landing_page_url":"https://doaj.org/article/42b73256bf5343e5be2d1ff0709dcbaf","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data, Vol 8, Iss 5, p 89 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2306-5729/8/5/89/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/data8050089","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data; Volume 8; Issue 5; Pages: 89","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/data8050089","is_oa":true,"landing_page_url":"https://doi.org/10.3390/data8050089","pdf_url":"https://www.mdpi.com/2306-5729/8/5/89/pdf?version=1684135949","source":{"id":"https://openalex.org/S4210226510","display_name":"Data","issn_l":"2306-5729","issn":["2306-5729"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8700000047683716,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4376273932.pdf"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W1967932898","https://openalex.org/W1971714722","https://openalex.org/W2066792529","https://openalex.org/W2108494079","https://openalex.org/W2296213241","https://openalex.org/W2731701007","https://openalex.org/W2740691457","https://openalex.org/W2745251428","https://openalex.org/W2770994574","https://openalex.org/W2891047772","https://openalex.org/W2980440349","https://openalex.org/W2994956951","https://openalex.org/W3083208972","https://openalex.org/W3093050310","https://openalex.org/W3176301080","https://openalex.org/W3181525942","https://openalex.org/W3205378831","https://openalex.org/W3213770309","https://openalex.org/W4214486444","https://openalex.org/W4298840395","https://openalex.org/W4307703618"],"related_works":["https://openalex.org/W2161008081","https://openalex.org/W2100947578","https://openalex.org/W1555832326","https://openalex.org/W2775554247","https://openalex.org/W2110168585","https://openalex.org/W3107474891","https://openalex.org/W2250213760","https://openalex.org/W4386247111","https://openalex.org/W4327642362","https://openalex.org/W2587014613"],"abstract_inverted_index":{"This":[0,169],"paper":[1],"presents":[2],"a":[3,45,152,177],"unique":[4],"and":[5,50,63,85,89,98,109,118,124,139,156,174,190],"extensive":[6],"dataset":[7,68,171],"containing":[8],"over":[9],"33":[10],"million":[11],"entries":[12],"with":[13,176],"pairs":[14],"in":[15,52,186,193],"the":[16,24,38,53,113,145,149,157,167,182,194],"form":[17],"\u201cspelling":[18],"error":[19],"\u2192":[20],"correction\u201d":[21],"from":[22,37],"ispravi.me,":[23],"most":[25,114],"popular":[26],"Croatian":[27,146,195],"online":[28],"spellchecking":[29,78],"service,":[30],"collected":[31],"since":[32],"2008.":[33],"The":[34,67],"dataset,":[35],"compiled":[36],"contribution":[39],"of":[40,55,151,159,166,179],"nearly":[41],"900,000":[42],"users,":[43],"is":[44],"valuable":[46],"resource":[47],"for":[48,184],"researchers":[49,173],"developers":[51],"field":[54],"natural":[56],"language":[57,64,93,147,188],"processing":[58],"(NLP),":[59],"improving":[60,77,132],"spellcheck":[61],"accuracy,":[62],"learning":[65],"applications.":[66],"may":[69],"be":[70],"used":[71],"to":[72,111,144],"accomplish":[73],"several":[74],"goals:":[75],"(1)":[76],"accuracy":[79],"by":[80],"incorporating":[81],"common":[82,96,115],"user":[83],"corrections":[84],"reducing":[86],"false":[87],"positives":[88],"negatives;":[90],"(2)":[91],"helping":[92],"learners":[94],"identify":[95],"errors":[97,117],"learn":[99],"correct":[100],"spelling":[101,116],"through":[102],"targeted":[103],"feedback;":[104],"(3)":[105],"analyzing":[106],"data":[107],"trends":[108],"patterns":[110],"uncover":[112],"their":[119],"underlying":[120],"causes;":[121],"(4)":[122],"identifying":[123],"evaluating":[125],"factors":[126],"that":[127],"influence":[128],"typing":[129],"input;":[130],"(5)":[131],"NLP":[133,191],"applications":[134,192],"such":[135],"as":[136],"text":[137],"recognition":[138],"machine":[140],"translation.":[141],"Tasks":[142],"specific":[143],"include":[148],"creation":[150],"letter-level":[153],"confusion":[154],"matrix":[155],"refinement":[158],"word":[160],"suggestions":[161],"based":[162],"on":[163],"historical":[164],"usage":[165],"service.":[168],"comprehensive":[170],"provides":[172],"practitioners":[175],"wealth":[178],"information,":[180],"opening":[181],"path":[183],"advancements":[185],"spellchecking,":[187],"learning,":[189],"language.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2023-05-13T00:00:00"}
