{"id":"https://openalex.org/W7125141928","doi":"https://doi.org/10.48550/arxiv.2601.12132","title":"Bengali Text Classification: An Evaluation of Large Language Model Approaches","display_name":"Bengali Text Classification: An Evaluation of Large Language Model Approaches","publication_year":2026,"publication_date":"2026-01-17","ids":{"openalex":"https://openalex.org/W7125141928","doi":"https://doi.org/10.48550/arxiv.2601.12132"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.12132","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12132","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.12132","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123523937","display_name":"Md Mahmudul Hoque","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hoque, Md Mahmudul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095828819","display_name":"Md Mehedi Hassain","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hassain, Md Mehedi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123500760","display_name":"Md Hojaifa Tanvir","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tanvir, Md Hojaifa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5038766443","display_name":"Rahul Nandy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nandy, Rahul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.6035000085830688,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.6035000085830688,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.06870000064373016,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.040300000458955765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bengali","display_name":"Bengali","score":0.9943000078201294},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6819000244140625},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5514000058174133},{"id":"https://openalex.org/keywords/newspaper","display_name":"Newspaper","score":0.5216000080108643},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.45579999685287476},{"id":"https://openalex.org/keywords/scarcity","display_name":"Scarcity","score":0.38960000872612}],"concepts":[{"id":"https://openalex.org/C19235068","wikidata":"https://www.wikidata.org/wiki/Q9610","display_name":"Bengali","level":2,"score":0.9943000078201294},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7181000113487244},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6819000244140625},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6740999817848206},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6306999921798706},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5514000058174133},{"id":"https://openalex.org/C201280247","wikidata":"https://www.wikidata.org/wiki/Q11032","display_name":"Newspaper","level":2,"score":0.5216000080108643},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.45579999685287476},{"id":"https://openalex.org/C109747225","wikidata":"https://www.wikidata.org/wiki/Q815758","display_name":"Scarcity","level":2,"score":0.38960000872612},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3555999994277954},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.33719998598098755},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.33169999718666077},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2784999907016754}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.12132","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12132","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.12132","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12132","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8719515204429626,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Bengali":[0,21,48,135,144],"text":[1,13,136],"classification":[2,91,102,164],"is":[3,14],"a":[4,63],"Significant":[5],"task":[6,87],"in":[7,46,109,134],"natural":[8],"language":[9,34,43],"processing":[10],"(NLP),":[11],"where":[12],"categorized":[15],"into":[16],"predefined":[17],"labels.":[18],"Unlike":[19],"English,":[20],"faces":[22],"challenges":[23],"due":[24],"to":[25,162],"the":[26,39,89,94,100,110,130,139],"lack":[27],"of":[28,41,58,104,122,132,141],"extensive":[29],"annotated":[30],"datasets":[31],"and":[32,78,117,124,158],"pre-trained":[33],"models.":[35],"This":[36],"study":[37],"explores":[38],"effectiveness":[40,131],"large":[42],"models":[44],"(LLMs)":[45],"classifying":[47],"newspaper":[49],"articles.":[50],"The":[51,127],"dataset":[52],"used,":[53],"obtained":[54],"from":[55,60],"Kaggle,":[56],"consists":[57],"articles":[59],"Prothom":[61],"Alo,":[62],"major":[64],"Bangladeshi":[65],"newspaper.":[66],"Three":[67],"instruction-tuned":[68],"LLMs":[69,133],"LLaMA":[70,74,115,118],"3.1":[71,116],"8B":[72],"Instruct,":[73,77],"3.2":[75,119],"3B":[76],"Qwen":[79,97],"2.5":[80,98],"7B":[81],"Instruct":[82],"were":[83],"evaluated":[84,95],"for":[85,143],"this":[86],"under":[88],"same":[90],"framework.":[92],"Among":[93],"models,":[96,153],"achieved":[99],"highest":[101],"accuracy":[103],"72%,":[105],"showing":[106],"particular":[107],"strength":[108],"\"Sports\"":[111],"category.":[112],"In":[113],"comparison,":[114],"attained":[120],"accuracies":[121],"53%":[123],"56%,":[125],"respectively.":[126],"findings":[128],"highlight":[129],"classification,":[137],"despite":[138],"scarcity":[140],"resources":[142],"NLP.":[145],"Future":[146],"research":[147],"will":[148],"focus":[149],"on":[150],"exploring":[151],"additional":[152],"addressing":[154],"class":[155],"imbalance":[156],"issues,":[157],"refining":[159],"fine-tuning":[160],"approaches":[161],"improve":[163],"performance.":[165]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-01-22T00:00:00"}
