{"id":"https://openalex.org/W4415048073","doi":"https://doi.org/10.1109/access.2025.3620264","title":"Performance of Classification Algorithms Under Class Imbalance: Simulation and Real-World Evidence","display_name":"Performance of Classification Algorithms Under Class Imbalance: Simulation and Real-World Evidence","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4415048073","doi":"https://doi.org/10.1109/access.2025.3620264"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3620264","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3620264","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3620264","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Iqra Arshad","orcid":null},"institutions":[{"id":"https://openalex.org/I12469534","display_name":"Quaid-i-Azam University","ror":"https://ror.org/04s9hft57","country_code":"PK","type":"education","lineage":["https://openalex.org/I12469534"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Iqra Arshad","raw_affiliation_strings":["Department of Statistics, Quaid-i-Azam University, Islamabad, Pakistan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Statistics, Quaid-i-Azam University, Islamabad, Pakistan","institution_ids":["https://openalex.org/I12469534"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106375340","display_name":"Muhammad Umair","orcid":"https://orcid.org/0000-0001-6119-5241"},"institutions":[{"id":"https://openalex.org/I12469534","display_name":"Quaid-i-Azam University","ror":"https://ror.org/04s9hft57","country_code":"PK","type":"education","lineage":["https://openalex.org/I12469534"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Muhammad Umair","raw_affiliation_strings":["Department of Statistics, Quaid-i-Azam University, Islamabad, Pakistan"],"raw_orcid":"https://orcid.org/0000-0001-6119-5241","affiliations":[{"raw_affiliation_string":"Department of Statistics, Quaid-i-Azam University, Islamabad, Pakistan","institution_ids":["https://openalex.org/I12469534"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066747669","display_name":"Faheem Jan","orcid":"https://orcid.org/0000-0002-7788-206X"},"institutions":[{"id":"https://openalex.org/I1305695959","display_name":"Bacha Khan University","ror":"https://ror.org/02an6vg71","country_code":"PK","type":"education","lineage":["https://openalex.org/I1305695959"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Faheem Jan","raw_affiliation_strings":["Department of Mathematics and Statistics, Bacha Khan University, Charsadda, Pakistan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mathematics and Statistics, Bacha Khan University, Charsadda, Pakistan","institution_ids":["https://openalex.org/I1305695959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080132651","display_name":"Hasnain Iftikhar","orcid":"https://orcid.org/0000-0002-8533-5410"},"institutions":[{"id":"https://openalex.org/I12469534","display_name":"Quaid-i-Azam University","ror":"https://ror.org/04s9hft57","country_code":"PK","type":"education","lineage":["https://openalex.org/I12469534"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Hasnain Iftikhar","raw_affiliation_strings":["Department of Statistics, Quaid-i-Azam University, Islamabad, Pakistan"],"raw_orcid":"https://orcid.org/0000-0002-8533-5410","affiliations":[{"raw_affiliation_string":"Department of Statistics, Quaid-i-Azam University, Islamabad, Pakistan","institution_ids":["https://openalex.org/I12469534"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024974930","display_name":"Paulo Canas Rodrigues","orcid":"https://orcid.org/0000-0002-1248-9910"},"institutions":[{"id":"https://openalex.org/I126158947","display_name":"Universidade Federal da Bahia","ror":"https://ror.org/03k3p7647","country_code":"BR","type":"education","lineage":["https://openalex.org/I126158947"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Paulo Canas Rodrigues","raw_affiliation_strings":["Department of Statistics, Federal University of Bahia, Salvador, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-1248-9910","affiliations":[{"raw_affiliation_string":"Department of Statistics, Federal University of Bahia, Salvador, Brazil","institution_ids":["https://openalex.org/I126158947"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ronny Ivan Gonzales Medina","orcid":null},"institutions":[{"id":"https://openalex.org/I3133295647","display_name":"National University Toribio Rodr\u00edguez de Mendoza","ror":"https://ror.org/0323wfn23","country_code":"PE","type":"education","lineage":["https://openalex.org/I3133295647"]},{"id":"https://openalex.org/I4210160924","display_name":"Universidad Panamericana","ror":"https://ror.org/05pd6sh18","country_code":"GT","type":"education","lineage":["https://openalex.org/I4210160924"]}],"countries":["GT","PE"],"is_corresponding":false,"raw_author_name":"Ronny Ivan Gonzales Medina","raw_affiliation_strings":["Facultad de Ciencias e Ingenier&#x00ED;as f&#x00ED;sicas y formales, Universidad Cat&#x00F3;lica de Santa Mar&#x00ED;a, Arequipa, Peru","Instituto de Investigaci&#x00F3;n de Estudios Estad&#x00ED;sticos y Control de Calidad, Universidad Nacional Toribio Rodr&#x00ED;guez de Mendoza, Chachapoyas, Peru"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Facultad de Ciencias e Ingenier&#x00ED;as f&#x00ED;sicas y formales, Universidad Cat&#x00F3;lica de Santa Mar&#x00ED;a, Arequipa, Peru","institution_ids":["https://openalex.org/I4210160924"]},{"raw_affiliation_string":"Instituto de Investigaci&#x00F3;n de Estudios Estad&#x00ED;sticos y Control de Calidad, Universidad Nacional Toribio Rodr&#x00ED;guez de Mendoza, Chachapoyas, Peru","institution_ids":["https://openalex.org/I3133295647"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030048049","display_name":"Javier Linkolk L\u00f3pez\u2010Gonzales","orcid":"https://orcid.org/0000-0003-0847-0552"},"institutions":[{"id":"https://openalex.org/I4210140760","display_name":"Universidad Peruana Uni\u00f3n","ror":"https://ror.org/042gckq23","country_code":"PE","type":"education","lineage":["https://openalex.org/I4210140760"]}],"countries":["PE"],"is_corresponding":false,"raw_author_name":"Javier Linkolk L\u00f3pez-Gonzales","raw_affiliation_strings":["Escuela de Posgrado, Universidad Peruana Uni&#x00F3;n, Lima, Peru"],"raw_orcid":"https://orcid.org/0000-0003-0847-0552","affiliations":[{"raw_affiliation_string":"Escuela de Posgrado, Universidad Peruana Uni&#x00F3;n, Lima, Peru","institution_ids":["https://openalex.org/I4210140760"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I12469534"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":6.2328,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96367323,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"13","issue":null,"first_page":"179672","last_page":"179685"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11653","display_name":"Financial Distress and Bankruptcy Prediction","score":0.9228000044822693,"subfield":{"id":"https://openalex.org/subfields/1402","display_name":"Accounting"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.7555999755859375},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.7218999862670898},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6965000033378601},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6632999777793884},{"id":"https://openalex.org/keywords/statistical-classification","display_name":"Statistical classification","score":0.5343999862670898},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4691999852657318},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.3928000032901764},{"id":"https://openalex.org/keywords/logistic-model-tree","display_name":"Logistic model tree","score":0.3885999917984009}],"concepts":[{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.7555999755859375},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.7218999862670898},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7178000211715698},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7088000178337097},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7077999711036682},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6965000033378601},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6632999777793884},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.5343999862670898},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4691999852657318},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.3928000032901764},{"id":"https://openalex.org/C61722155","wikidata":"https://www.wikidata.org/wiki/Q6667643","display_name":"Logistic model tree","level":3,"score":0.3885999917984009},{"id":"https://openalex.org/C123860398","wikidata":"https://www.wikidata.org/wiki/Q6934605","display_name":"Multiclass classification","level":3,"score":0.3546999990940094},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35440000891685486},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.34529998898506165},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.33709999918937683},{"id":"https://openalex.org/C139532973","wikidata":"https://www.wikidata.org/wiki/Q2679259","display_name":"Linear classifier","level":3,"score":0.3368000090122223},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.33090001344680786},{"id":"https://openalex.org/C34872919","wikidata":"https://www.wikidata.org/wiki/Q7092302","display_name":"One-class classification","level":3,"score":0.3273000121116638},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2989000082015991},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.2800999879837036},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26089999079704285}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3620264","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3620264","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:fb78969af0554a91ab426f3a6fb25e0c","is_oa":true,"landing_page_url":"https://doaj.org/article/fb78969af0554a91ab426f3a6fb25e0c","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 179672-179685 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3620264","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3620264","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Class":[0],"imbalance":[1,37],"is":[2,99,154],"a":[3,125,134],"persistent":[4],"challenge":[5],"in":[6,10,102,111,187],"machine":[7],"learning,":[8],"particularly":[9],"high-stakes":[11],"applications":[12],"such":[13],"as":[14],"medical":[15],"diagnostics,":[16],"bioinformatics,":[17],"and":[18,72,89,116,166,184],"fraud":[19],"detection,":[20],"where":[21,163],"the":[22,34,51],"minority":[23,55,138],"class":[24,109,139],"often":[25],"represents":[26],"critical":[27],"cases.":[28],"While":[29],"prior":[30],"research":[31],"has":[32,43],"examined":[33],"effect":[35],"of":[36,54,113],"on":[38,156],"classifier":[39,141],"performance,":[40],"little":[41],"attention":[42],"been":[44],"paid":[45],"to":[46,58],"establishing":[47,172],"practical":[48,135,179],"guidelines":[49],"for":[50,124,137,181],"minimum":[52],"proportion":[53],"samples":[56,147],"required":[57],"achieve":[59],"reliable":[60],"sensitivity.":[61,170],"In":[62],"this":[63,176],"study,":[64],"we":[65,132],"conduct":[66],"extensive":[67],"simulations":[68],"using":[69],"synthetic":[70],"datasets":[71],"evaluate":[73],"five":[74],"widely":[75],"used":[76],"classification":[77,189],"algorithms:":[78],"Logistic":[79],"Regression":[80],"(Logit),":[81],"Support":[82],"Vector":[83],"Machines":[84],"(SVM),":[85],"Random":[86],"Forest,":[87],"XGBoost,":[88],"Neural":[90,119,164],"Networks":[91,165],"(NNs).":[92],"Our":[93],"analysis":[94],"reveals":[95],"that":[96],"logistic":[97,129],"regression":[98],"more":[100],"effective":[101],"identifying":[103],"minority-class":[104],"instances":[105],"under":[106],"an":[107,173],"imbalanced":[108,188],"distribution":[110,127],"terms":[112],"F1":[114],"score":[115],"sensitivity,":[117],"whereas":[118],"Network":[120],"slightly":[121],"performs":[122],"better":[123],"balanced-class":[126],"than":[128],"regression.":[130],"Importantly,":[131],"identify":[133],"threshold":[136],"representation:":[140],"sensitivity":[142],"declines":[143],"sharply":[144],"when":[145],"positive":[146],"fall":[148],"below":[149],"approximately":[150],"25\u201330%.":[151],"This":[152],"finding":[153],"validated":[155],"eight":[157],"real-world":[158],"datasets,":[159],"including":[160],"large-scale":[161],"applications,":[162],"XGBoost":[167],"demonstrate":[168],"superior":[169],"By":[171],"actionable":[174],"threshold,":[175],"study":[177],"contributes":[178],"guidance":[180],"dataset":[182],"design":[183],"model":[185],"selection":[186],"problems.":[190]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-11T00:00:00"}
