{"id":"https://openalex.org/W4383818636","doi":"https://doi.org/10.3390/computers12070137","title":"Unifying Sentence Transformer Embedding and Softmax Voting Ensemble for Accurate News Category Prediction","display_name":"Unifying Sentence Transformer Embedding and Softmax Voting Ensemble for Accurate News Category Prediction","publication_year":2023,"publication_date":"2023-07-08","ids":{"openalex":"https://openalex.org/W4383818636","doi":"https://doi.org/10.3390/computers12070137"},"language":"en","primary_location":{"id":"doi:10.3390/computers12070137","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers12070137","pdf_url":"https://www.mdpi.com/2073-431X/12/7/137/pdf?version=1689042915","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2073-431X/12/7/137/pdf?version=1689042915","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057208010","display_name":"Saima K. Khosa","orcid":"https://orcid.org/0000-0001-8249-2843"},"institutions":[{"id":"https://openalex.org/I174731842","display_name":"Islamia University of Bahawalpur","ror":"https://ror.org/002rc4w13","country_code":"PK","type":"education","lineage":["https://openalex.org/I174731842"]},{"id":"https://openalex.org/I4210102737","display_name":"Khwaja Fareed University of Engineering and Information Technology","ror":"https://ror.org/0161dyt30","country_code":"PK","type":"education","lineage":["https://openalex.org/I4210102737"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Saima Khosa","raw_affiliation_strings":["Department of Information Security, The Islamia University of Bahawalpur, Bahawalpur 63100, Pakistan","Department of Information Technology, Khwaja Fareed University of Engineering and Information Technology, Rahim Yar Khan 64200, Pakistan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Security, The Islamia University of Bahawalpur, Bahawalpur 63100, Pakistan","institution_ids":["https://openalex.org/I174731842"]},{"raw_affiliation_string":"Department of Information Technology, Khwaja Fareed University of Engineering and Information Technology, Rahim Yar Khan 64200, Pakistan","institution_ids":["https://openalex.org/I4210102737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087270783","display_name":"Arif Mehmood","orcid":"https://orcid.org/0000-0001-5822-4005"},"institutions":[{"id":"https://openalex.org/I174731842","display_name":"Islamia University of Bahawalpur","ror":"https://ror.org/002rc4w13","country_code":"PK","type":"education","lineage":["https://openalex.org/I174731842"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Arif Mehmood","raw_affiliation_strings":["Department of Information Security, The Islamia University of Bahawalpur, Bahawalpur 63100, Pakistan"],"raw_orcid":"https://orcid.org/0000-0001-5822-4005","affiliations":[{"raw_affiliation_string":"Department of Information Security, The Islamia University of Bahawalpur, Bahawalpur 63100, Pakistan","institution_ids":["https://openalex.org/I174731842"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073229186","display_name":"Muhammad Rizwan","orcid":"https://orcid.org/0000-0001-6286-2544"},"institutions":[{"id":"https://openalex.org/I4210102737","display_name":"Khwaja Fareed University of Engineering and Information Technology","ror":"https://ror.org/0161dyt30","country_code":"PK","type":"education","lineage":["https://openalex.org/I4210102737"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Muhammad Rizwan","raw_affiliation_strings":["Department of Information Technology, Khwaja Fareed University of Engineering and Information Technology, Rahim Yar Khan 64200, Pakistan"],"raw_orcid":"https://orcid.org/0000-0001-6286-2544","affiliations":[{"raw_affiliation_string":"Department of Information Technology, Khwaja Fareed University of Engineering and Information Technology, Rahim Yar Khan 64200, Pakistan","institution_ids":["https://openalex.org/I4210102737"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5073229186"],"corresponding_institution_ids":["https://openalex.org/I4210102737"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":1.3254,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.84225448,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"12","issue":"7","first_page":"137","last_page":"137"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/softmax-function","display_name":"Softmax function","score":0.9314465522766113},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.7566680908203125},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.6390939950942993},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5876805782318115},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.53528892993927},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5326003432273865},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5164273381233215},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.5099164247512817},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4753924608230591},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4557781219482422},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.4414242208003998},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4383038282394409},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4172121286392212},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3804967999458313},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.20767349004745483}],"concepts":[{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.9314465522766113},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.7566680908203125},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6390939950942993},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5876805782318115},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.53528892993927},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5326003432273865},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5164273381233215},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.5099164247512817},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4753924608230591},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4557781219482422},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.4414242208003998},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4383038282394409},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4172121286392212},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3804967999458313},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.20767349004745483},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/computers12070137","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers12070137","pdf_url":"https://www.mdpi.com/2073-431X/12/7/137/pdf?version=1689042915","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b661eede3525486b95c536f726e29bc9","is_oa":true,"landing_page_url":"https://doaj.org/article/b661eede3525486b95c536f726e29bc9","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers, Vol 12, Iss 7, p 137 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/computers12070137","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers12070137","pdf_url":"https://www.mdpi.com/2073-431X/12/7/137/pdf?version=1689042915","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4383818636.pdf"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W2947919375","https://openalex.org/W2948589047","https://openalex.org/W2969545244","https://openalex.org/W2982112604","https://openalex.org/W3008340068","https://openalex.org/W3097652332","https://openalex.org/W3105816068","https://openalex.org/W3122116274","https://openalex.org/W3139958517","https://openalex.org/W3147153144","https://openalex.org/W3158558892","https://openalex.org/W3163378241","https://openalex.org/W3175962275","https://openalex.org/W3183676217","https://openalex.org/W3199353897","https://openalex.org/W3202548348","https://openalex.org/W3214828763","https://openalex.org/W4200040201","https://openalex.org/W4200233281","https://openalex.org/W4200245209","https://openalex.org/W4200455899","https://openalex.org/W4281748497","https://openalex.org/W4287888702","https://openalex.org/W4293462507","https://openalex.org/W4293767192","https://openalex.org/W4294133266","https://openalex.org/W4294343992","https://openalex.org/W4312590785","https://openalex.org/W4312875997","https://openalex.org/W4318484691","https://openalex.org/W4322746638","https://openalex.org/W4385573170","https://openalex.org/W6803943978"],"related_works":["https://openalex.org/W3107204728","https://openalex.org/W4287591324","https://openalex.org/W4226420367","https://openalex.org/W2980176872","https://openalex.org/W2962876041","https://openalex.org/W3090555870","https://openalex.org/W3108503355","https://openalex.org/W2249953602","https://openalex.org/W3134502938","https://openalex.org/W1980222719"],"abstract_inverted_index":{"The":[0,43,93,121,135,154,239,260],"study":[1,122],"focuses":[2],"on":[3],"news":[4,39,91,296],"category":[5,297],"prediction":[6],"and":[7,21,23,33,49,97,119,131,161,226,249,257,266,274,292],"investigates":[8],"the":[9,67,73,86,90,103,127,143,150,164,180,199,211,214,235,243,280,283],"performance":[10,94,128,144,245],"of":[11,14,56,89,95,106,129,145,168,184,207,216,246,254,282],"sentence":[12,83,232],"embedding":[13,178],"four":[15],"transformer":[16,64,147,218,264,287],"models":[17],"(BERT,":[18],"RoBERTa,":[19],"MPNet,":[20],"T5)":[22],"their":[24],"variants":[25],"as":[26,72,100,102,114,221],"feature":[27],"vectors":[28],"when":[29,170,186,196,228],"combined":[30,171],"with":[31,66,172,188,286],"Softmax":[32,96,130,189,255],"Random":[34,98,132,173,236,258],"Forest":[35,133,237],"using":[36,63,110],"two":[37],"accessible":[38],"datasets":[40],"from":[41],"Kaggle.":[42],"data":[44],"are":[45,61],"stratified":[46],"into":[47],"train":[48],"test":[50],"sets":[51],"to":[52,141,230],"ensure":[53],"equal":[54],"representation":[55,81],"each":[57],"category.":[58],"Word":[59],"embeddings":[60,148,233,265,288],"generated":[62],"models,":[65,219],"last":[68],"hidden":[69],"layer":[70],"selected":[71],"embedding.":[74],"Mean":[75],"pooling":[76],"calculates":[77],"a":[78],"single":[79],"vector":[80],"called":[82],"embedding,":[84],"capturing":[85],"overall":[87],"meaning":[88],"article.":[92],"Forest,":[99,174],"well":[101,195],"soft":[104],"voting":[105,200,253,261,284],"both,":[107],"is":[108,139],"evaluated":[109],"evaluation":[111],"measures":[112],"such":[113,220],"accuracy,":[115],"F1":[116,137,166,182,205],"score,":[117],"precision,":[118],"recall.":[120],"also":[123,241],"contributes":[124],"by":[125],"evaluating":[126],"individually.":[134],"macro-average":[136],"score":[138,167,183,206],"calculated":[140],"compare":[142],"different":[146],"in":[149,198,252,289],"same":[151],"experimental":[152],"settings.":[153],"experiments":[155,212],"reveal":[156],"that":[157],"MPNet":[158,191,222,224],"versions":[159],"v1":[160,192],"v3":[162],"achieve":[163],"highest":[165,181],"97.7%":[169],"while":[175],"T5":[176,247],"Large":[177,248,251],"achieves":[179],"98.2%":[185],"used":[187,197,229],"regression.":[190],"performs":[193],"exceptionally":[194],"classifier,":[201,262],"obtaining":[202],"an":[203],"impressive":[204],"98.6%.":[208],"In":[209],"conclusion,":[210],"validate":[213],"superiority":[215],"certain":[217],"v1,":[223],"v3,":[225],"DistilRoBERTa,":[227],"calculate":[231],"within":[234],"framework.":[238],"results":[240],"highlight":[242],"promising":[244],"RoBERTa":[250],"regression":[256],"Forest.":[259],"employing":[263],"ensemble":[267],"learning":[268],"techniques,":[269],"consistently":[270],"outperforms":[271],"other":[272],"baselines":[273],"individual":[275],"algorithms.":[276],"These":[277],"findings":[278],"emphasize":[279],"effectiveness":[281],"classifier":[285],"achieving":[290],"accurate":[291],"reliable":[293],"predictions":[294],"for":[295],"classification":[298],"tasks.":[299]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2023-07-11T00:00:00"}
