{"id":"https://openalex.org/W2982687734","doi":"https://doi.org/10.26615/issn.2603-2821.2019_001","title":"Normalization of Kazakh Texts","display_name":"Normalization of Kazakh Texts","publication_year":2019,"publication_date":"2019-09-15","ids":{"openalex":"https://openalex.org/W2982687734","doi":"https://doi.org/10.26615/issn.2603-2821.2019_001","mag":"2982687734"},"language":"en","primary_location":{"id":"doi:10.26615/issn.2603-2821.2019_001","is_oa":true,"landing_page_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","pdf_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Student Research Workshop Associated with RANLP 2019","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063291688","display_name":"Assina Abdussaitova","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Assina Abdussaitova","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5019241703","display_name":"Alina Amangeldiyeva","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alina Amangeldiyeva","raw_affiliation_strings":["University Computer Science Kazakhstan, Kaskelen"],"affiliations":[{"raw_affiliation_string":"University Computer Science Kazakhstan, Kaskelen","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5063291688"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.13318447,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.8618999719619751,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.8618999719619751,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kazakh","display_name":"Kazakh","score":0.9561985731124878},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.8623574376106262},{"id":"https://openalex.org/keywords/agglutinative-language","display_name":"Agglutinative language","score":0.8516383171081543},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.794161319732666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6133742928504944},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5293251872062683},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.21972313523292542}],"concepts":[{"id":"https://openalex.org/C2781297163","wikidata":"https://www.wikidata.org/wiki/Q9252","display_name":"Kazakh","level":2,"score":0.9561985731124878},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.8623574376106262},{"id":"https://openalex.org/C80875076","wikidata":"https://www.wikidata.org/wiki/Q171263","display_name":"Agglutinative language","level":3,"score":0.8516383171081543},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.794161319732666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6133742928504944},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5293251872062683},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.21972313523292542},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C165297611","wikidata":"https://www.wikidata.org/wiki/Q43249","display_name":"Morpheme","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.26615/issn.2603-2821.2019_001","is_oa":true,"landing_page_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","pdf_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Student Research Workshop Associated with RANLP 2019","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.26615/issn.2603-2821.2019_001","is_oa":true,"landing_page_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","pdf_url":"https://doi.org/10.26615/issn.2603-2821.2019_001","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Student Research Workshop Associated with RANLP 2019","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.75,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2982687734.pdf","grobid_xml":"https://content.openalex.org/works/W2982687734.grobid-xml"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W3455125","https://openalex.org/W62785058","https://openalex.org/W1597191941","https://openalex.org/W1647671624","https://openalex.org/W1999179414","https://openalex.org/W2018616927","https://openalex.org/W2066792529","https://openalex.org/W2094980874","https://openalex.org/W2196613303","https://openalex.org/W2251290832","https://openalex.org/W2620138912","https://openalex.org/W2941509535"],"related_works":["https://openalex.org/W2363093443","https://openalex.org/W4206915444","https://openalex.org/W4388766676","https://openalex.org/W2970682420","https://openalex.org/W2539790792","https://openalex.org/W3013913162","https://openalex.org/W3204019825","https://openalex.org/W3136915866","https://openalex.org/W44901218","https://openalex.org/W2947417049"],"abstract_inverted_index":{"Kazakh,":[0],"like":[1],"other":[2],"agglutinative":[3],"languages,":[4],"has":[5,67],"specific":[6],"difficulties":[7],"on":[8,40],"both":[9],"recognition":[10],"of":[11,24,36,61,65,73,78],"wrong":[12],"words":[13],"and":[14,42,85],"generation":[15],"the":[16,34,49,79],"corrections":[17],"for":[18,33],"misspelt":[19],"words.":[20],"The":[21,59,76],"main":[22],"goal":[23],"this":[25,57],"work":[26],"is":[27,53],"to":[28],"develop":[29],"a":[30,71],"better":[31],"algorithm":[32],"normalization":[35,66],"Kazakh":[37],"texts":[38],"based":[39],"traditional":[41],"machine":[43],"learning":[44],"methods,":[45],"as":[46,48],"well":[47],"new":[50],"approach":[51],"which":[52],"also":[54],"considered":[55],"in":[56,70,88],"paper.":[58],"procedure":[60],"election":[62],"among":[63],"methods":[64],"been":[68],"conducted":[69],"manner":[72],"comparative":[74,80],"analysis.":[75],"results":[77],"analysis":[81],"turned":[82],"up":[83],"successful":[84],"are":[86],"shown":[87],"detail.":[89]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2019-11-08T00:00:00"}
