{"id":"https://openalex.org/W4414272318","doi":"https://doi.org/10.1109/ichms65439.2025.11154211","title":"Evaluating Large Language Models for Sentiment Analysis: A Comparative Study of Accuracy and Scalability","display_name":"Evaluating Large Language Models for Sentiment Analysis: A Comparative Study of Accuracy and Scalability","publication_year":2025,"publication_date":"2025-05-26","ids":{"openalex":"https://openalex.org/W4414272318","doi":"https://doi.org/10.1109/ichms65439.2025.11154211"},"language":"en","primary_location":{"id":"doi:10.1109/ichms65439.2025.11154211","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ichms65439.2025.11154211","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 5th International Conference on Human-Machine Systems (ICHMS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119647528","display_name":"Nouf Almontashry","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099699","display_name":"Jeddah University","ror":"https://ror.org/015ya8798","country_code":"SA","type":"education","lineage":["https://openalex.org/I4210099699"]}],"countries":["SA"],"is_corresponding":true,"raw_author_name":"Nouf Almontashry","raw_affiliation_strings":["Computer Science &#x0026; Engineering College, University of Jeddah,KSA"],"affiliations":[{"raw_affiliation_string":"Computer Science &#x0026; Engineering College, University of Jeddah,KSA","institution_ids":["https://openalex.org/I4210099699"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119647529","display_name":"Siba Ziadi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099699","display_name":"Jeddah University","ror":"https://ror.org/015ya8798","country_code":"SA","type":"education","lineage":["https://openalex.org/I4210099699"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Siba Ziadi","raw_affiliation_strings":["Computer Science &#x0026; Engineering College, University of Jeddah,KSA"],"affiliations":[{"raw_affiliation_string":"Computer Science &#x0026; Engineering College, University of Jeddah,KSA","institution_ids":["https://openalex.org/I4210099699"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119647530","display_name":"Khadeja Njaai","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099699","display_name":"Jeddah University","ror":"https://ror.org/015ya8798","country_code":"SA","type":"education","lineage":["https://openalex.org/I4210099699"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Khadeja Njaai","raw_affiliation_strings":["Computer Science &#x0026; Engineering College, University of Jeddah,KSA"],"affiliations":[{"raw_affiliation_string":"Computer Science &#x0026; Engineering College, University of Jeddah,KSA","institution_ids":["https://openalex.org/I4210099699"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013947843","display_name":"Rabab Alomairy","orcid":"https://orcid.org/0000-0001-9911-6094"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rabab Alomairy","raw_affiliation_strings":["Massachusetts Institute of Technology,Computer Science &#x0026; Artificial Intelligence Laboratory,USA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Computer Science &#x0026; Artificial Intelligence Laboratory,USA","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5119647528"],"corresponding_institution_ids":["https://openalex.org/I4210099699"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13713067,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"413","last_page":"419"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9343000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9343000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.6805999875068665},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6259999871253967},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4839000105857849},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4595000147819519},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.3831999897956848},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.36550000309944153},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3569999933242798}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.756600022315979},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.6805999875068665},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6607999801635742},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6259999871253967},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5090000033378601},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4846999943256378},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4839000105857849},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4595000147819519},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.3831999897956848},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.36550000309944153},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3569999933242798},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.3050000071525574},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.29429998993873596},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.28859999775886536},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2728999853134155},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.2694999873638153}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ichms65439.2025.11154211","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ichms65439.2025.11154211","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 5th International Conference on Human-Machine Systems (ICHMS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W4388777264","https://openalex.org/W4392240262","https://openalex.org/W4392353733","https://openalex.org/W4408666997"],"related_works":[],"abstract_inverted_index":{"Sentiment":[0],"analysis":[1],"plays":[2],"a":[3,62,125],"crucial":[4],"role":[5],"in":[6,143,162,179],"natural":[7],"language":[8],"processing":[9],"(NLP)":[10],"by":[11],"enabling":[12],"machines":[13],"to":[14,80,86],"interpret":[15],"human":[16,164],"emotions":[17],"from":[18],"text.":[19],"With":[20],"the":[21,47,68,157,183],"advent":[22],"of":[23,51,101,159,185],"Large":[24],"Language":[25],"Models":[26],"(LLMs),":[27],"sentiment":[28,48,146,180],"classification":[29,49],"has":[30],"gained":[31],"renewed":[32],"interest,":[33],"as":[34],"these":[35],"models":[36,178],"exhibit":[37],"advanced":[38],"contextual":[39],"understanding":[40],"and":[41,61,82,105],"reasoning":[42,187],"capabilities.":[43],"This":[44],"study":[45],"evaluates":[46],"performance":[50,121],"state-of-the-art":[52],"LLMs,":[53],"including":[54],"GPT-4o,":[55],"GPT-3.5,":[56],"DeepSeek":[57,93,173],"R1-Reasoning,":[58],"Llama":[59,133],"2-7B,":[60],"taskspecific":[63],"fine-tuned":[64,113],"DistilBERT":[65,114],"model.":[66],"Using":[67],"IMDB":[69],"dataset,":[70],"we":[71],"assess":[72],"model":[73],"accuracy":[74,100],"across":[75],"varying":[76],"sample":[77],"sizes":[78],"(50":[79],"300)":[81],"compare":[83],"their":[84],"results":[85,167],"humanlabeled":[87],"data.":[88],"Our":[89],"findings":[90],"reveal":[91],"that":[92,169],"R1Reasoning":[94],"outperforms":[95],"all":[96],"models,":[97],"achieving":[98],"an":[99],"96%,":[102],"while":[103],"GPT-4o":[104],"GPT-3.5":[106],"closely":[107],"follow":[108],"with":[109,136,150],"93%":[110],"accuracy.":[111],"The":[112,148],"model,":[115],"despite":[116],"being":[117],"lightweight,":[118],"delivers":[119],"competitive":[120],"(88%),":[122],"making":[123],"it":[124],"viable":[126],"alternative":[127],"for":[128,145],"resource-constrained":[129],"environments.":[130],"In":[131],"contrast,":[132],"2-7B":[134],"struggles":[135],"increasing":[137],"dataset":[138],"sizes,":[139],"highlighting":[140,182],"its":[141],"limitations":[142],"generalization":[144],"classification.":[147],"comparison":[149],"human-labeled":[151],"data":[152],"(91%":[153],"accuracy)":[154],"further":[155],"underscores":[156],"reliability":[158],"top-tier":[160],"LLMs":[161,171],"replicating":[163],"judgment.":[165],"These":[166],"demonstrate":[168],"reasoning-based":[170],"like":[172],"R1":[174],"can":[175],"surpass":[176],"conventional":[177],"analysis,":[181],"value":[184],"integrating":[186],"mechanisms":[188],"into":[189],"future":[190],"NLP":[191],"advancements.":[192]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
