{"id":"https://openalex.org/W4407394771","doi":"https://doi.org/10.3103/s0146411624700329","title":"Text Classification by CEFR Levels Using Machine Learning Methods and the BERT Language Model","display_name":"Text Classification by CEFR Levels Using Machine Learning Methods and the BERT Language Model","publication_year":2024,"publication_date":"2024-12-01","ids":{"openalex":"https://openalex.org/W4407394771","doi":"https://doi.org/10.3103/s0146411624700329"},"language":"en","primary_location":{"id":"doi:10.3103/s0146411624700329","is_oa":false,"landing_page_url":"https://doi.org/10.3103/s0146411624700329","pdf_url":null,"source":{"id":"https://openalex.org/S17203304","display_name":"Automatic Control and Computer Sciences","issn_l":"0146-4116","issn":["0146-4116","1558-108X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320267","host_organization_name":"Pleiades Publishing","host_organization_lineage":["https://openalex.org/P4310320267","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Pleiades Publishing","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Automatic Control and Computer Sciences","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040198515","display_name":"Nadezhda Lagutina","orcid":"https://orcid.org/0000-0002-6137-8643"},"institutions":[{"id":"https://openalex.org/I198371094","display_name":"Yaroslavl State University","ror":"https://ror.org/044s2fj67","country_code":"RU","type":"education","lineage":["https://openalex.org/I198371094"]}],"countries":["RU"],"is_corresponding":true,"raw_author_name":"N. S. Lagutina","raw_affiliation_strings":["Demidov Yaroslavl State University, 150003, Yaroslavl, Russia"],"raw_orcid":"https://orcid.org/0000-0002-6137-8643","affiliations":[{"raw_affiliation_string":"Demidov Yaroslavl State University, 150003, Yaroslavl, Russia","institution_ids":["https://openalex.org/I198371094"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002941314","display_name":"Ksenia Lagutina","orcid":"https://orcid.org/0000-0002-1742-3240"},"institutions":[{"id":"https://openalex.org/I198371094","display_name":"Yaroslavl State University","ror":"https://ror.org/044s2fj67","country_code":"RU","type":"education","lineage":["https://openalex.org/I198371094"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"K. V. Lagutina","raw_affiliation_strings":["Demidov Yaroslavl State University, 150003, Yaroslavl, Russia"],"raw_orcid":"https://orcid.org/0000-0002-1742-3240","affiliations":[{"raw_affiliation_string":"Demidov Yaroslavl State University, 150003, Yaroslavl, Russia","institution_ids":["https://openalex.org/I198371094"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093021186","display_name":"Anastasya M. Brederman","orcid":"https://orcid.org/0009-0003-1741-0604"},"institutions":[{"id":"https://openalex.org/I198371094","display_name":"Yaroslavl State University","ror":"https://ror.org/044s2fj67","country_code":"RU","type":"education","lineage":["https://openalex.org/I198371094"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"A. M. Brederman","raw_affiliation_strings":["Demidov Yaroslavl State University, 150003, Yaroslavl, Russia"],"raw_orcid":"https://orcid.org/0009-0003-1741-0604","affiliations":[{"raw_affiliation_string":"Demidov Yaroslavl State University, 150003, Yaroslavl, Russia","institution_ids":["https://openalex.org/I198371094"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053710320","display_name":"Natalia N. Kasatkina","orcid":"https://orcid.org/0000-0002-6757-9622"},"institutions":[{"id":"https://openalex.org/I198371094","display_name":"Yaroslavl State University","ror":"https://ror.org/044s2fj67","country_code":"RU","type":"education","lineage":["https://openalex.org/I198371094"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"N. N. Kasatkina","raw_affiliation_strings":["Demidov Yaroslavl State University, 150003, Yaroslavl, Russia"],"raw_orcid":"https://orcid.org/0000-0002-6757-9622","affiliations":[{"raw_affiliation_string":"Demidov Yaroslavl State University, 150003, Yaroslavl, Russia","institution_ids":["https://openalex.org/I198371094"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5040198515"],"corresponding_institution_ids":["https://openalex.org/I198371094"],"apc_list":null,"apc_paid":null,"fwci":3.3114,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.93353627,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"58","issue":"7","first_page":"869","last_page":"878"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9381155967712402},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.669651985168457},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6286795139312744},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5758559107780457},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34463775157928467}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9381155967712402},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.669651985168457},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6286795139312744},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5758559107780457},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34463775157928467}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3103/s0146411624700329","is_oa":false,"landing_page_url":"https://doi.org/10.3103/s0146411624700329","pdf_url":null,"source":{"id":"https://openalex.org/S17203304","display_name":"Automatic Control and Computer Sciences","issn_l":"0146-4116","issn":["0146-4116","1558-108X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320267","host_organization_name":"Pleiades Publishing","host_organization_lineage":["https://openalex.org/P4310320267","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Pleiades Publishing","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Automatic Control and Computer Sciences","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6499999761581421,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2952889708","https://openalex.org/W2963341956","https://openalex.org/W2970868759","https://openalex.org/W2978017171","https://openalex.org/W3037207300","https://openalex.org/W3159985722","https://openalex.org/W3170447087","https://openalex.org/W3201077663","https://openalex.org/W3205393847","https://openalex.org/W3212104084","https://openalex.org/W4205533984","https://openalex.org/W4210261798","https://openalex.org/W4212926655","https://openalex.org/W4287855117","https://openalex.org/W4312701156","https://openalex.org/W4361026235","https://openalex.org/W4381137031","https://openalex.org/W4385571576","https://openalex.org/W4385572889"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474"],"abstract_inverted_index":{"This":[0,86,163],"paper":[1],"presents":[2,88],"a":[3,33,42,228],"study":[4],"of":[5,8,11,22,30,40,67,91,155,170,186,190,196,209,211,218,236,252,260],"the":[6,20,23,28,63,68,81,89,92,109,113,129,148,158,168,171,207,212,216,223,234,237,246,250,258],"problem":[7],"automatic":[9,253],"classification":[10,133,191,219],"short":[12],"coherent":[13],"texts":[14],"(essays)":[15],"in":[16,32,49,231],"English":[17,122,161],"according":[18],"to":[19,143],"levels":[21,138],"international":[24],"CEFR":[25,120,137,159],"scale.":[26],"Determining":[27],"level":[29,255],"text":[31,57,118,224,239,254],"natural":[34],"language":[35,173],"is":[36,165,203],"an":[37,153,183],"important":[38],"component":[39],"assessing":[41],"student\u2019s":[43],"knowledge,":[44],"including":[45],"checking":[46],"open":[47,117],"tasks":[48],"e-learning":[50],"systems.":[51],"To":[52],"solve":[53],"this":[54],"problem,":[55],"vector":[56],"models":[58,240],"are":[59,78,126,145,198],"considered":[60],"based":[61],"on":[62,222],"stylometric":[64],"numerical":[65],"features":[66],"character,":[69],"word,":[70],"and":[71,104,108,124,139,257],"sentence":[72],"structure":[73],"levels.":[74],"The":[75,131,178,188],"obtained":[76,248],"vectors":[77],"classified":[79],"by":[80,147],"standard":[82],"machine":[83],"learning":[84],"classifiers.":[85],"article":[87],"results":[90,134,247],"three":[93],"most":[94,195],"successful":[95],"ones:":[96],"Support":[97,149],"Vector":[98,150],"Classifier,":[99,103],"Stochastic":[100],"Gradient":[101],"Descent":[102],"LogisticRegression.":[105],"Precision,":[106],"comprehensiveness,":[107],"F-measure":[110],"served":[111],"as":[112],"quality":[114,217],"measures.":[115],"Two":[116],"corpora,":[119],"Levelled":[121,160],"Texts":[123],"BEA-2019,":[125],"chosen":[127],"for":[128,135,157,241],"experiments.":[130],"best":[132,179],"six":[136],"sublevels":[140],"from":[141,206],"A1":[142],"C2":[144],"shown":[146],"Classifier":[151],"with":[152,167],"F-score":[154,184],"67%":[156],"Texts.":[162],"approach":[164],"compared":[166],"application":[169,235],"BERT":[172],"model":[174],"(six":[175],"different":[176,242],"variants).":[177],"model,":[180],"bert-base-cased,":[181],"provided":[182],"value":[185],"69%.":[187],"analysis":[189],"errors":[192],"shows":[193],"that":[194],"them":[197],"between":[199],"neighboring":[200],"levels,":[201],"which":[202,226],"quite":[204],"understandable":[205],"point":[208],"view":[210],"domain.":[213],"In":[214,244],"addition,":[215],"strongly":[220],"depends":[221],"corpus,":[225],"demonstrates":[227],"significant":[229],"difference":[230],"F-scores":[232],"during":[233],"same":[238],"corpora.":[243],"general,":[245],"show":[249],"effectiveness":[251],"determination":[256],"possibility":[259],"its":[261],"practical":[262],"application.":[263]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
