{"id":"https://openalex.org/W7133340190","doi":"https://doi.org/10.48550/arxiv.2603.00208","title":"Tipping the Balance: Impact of Class Imbalance Correction on the Performance of Clinical Risk Prediction Models","display_name":"Tipping the Balance: Impact of Class Imbalance Correction on the Performance of Clinical Risk Prediction Models","publication_year":2026,"publication_date":"2026-02-27","ids":{"openalex":"https://openalex.org/W7133340190","doi":"https://doi.org/10.48550/arxiv.2603.00208"},"language":"en","primary_location":{"id":"pmh:oai:pure.atira.dk:openaire/b4929c91-b7bc-476c-b1ff-a7570623bc56","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2603.00208","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Andersen, A K, Mehdizavareh, M H, Khan, A, Becher, T, Britsch, S, Britsch, M, B\u00f6ttcher, M, Winther, S, Rohde, P D, Jensen, M H & Cichosz, S L 2026 'Tipping the Balance : Impact of Class Imbalance Correction on the Performance of Clinical Risk Prediction Models' arXiv. https://doi.org/10.48550/arXiv.2603.00208","raw_type":"workingPaper"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2603.00208","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127903586","display_name":"Amalie Koch Andersen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andersen, Amalie Koch","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114637494","display_name":"Hadi Mehdizavareh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mehdizavareh, Hadi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101527714","display_name":"Arijit Khan","orcid":"https://orcid.org/0000-0002-5234-7423"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khan, Arijit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085027781","display_name":"Tobias Becher","orcid":"https://orcid.org/0000-0001-7670-757X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Becher, Tobias","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042330789","display_name":"Simone Britsch","orcid":"https://orcid.org/0009-0001-2212-4114"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Britsch, Simone","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009377179","display_name":"M. Britsch","orcid":"https://orcid.org/0009-0004-7257-6057"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Britsch, Markward","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"B\u00f8ttcher, Morten","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"B\u00f8ttcher, Morten","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124323775","display_name":"S Winther","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Winther, Simon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111165048","display_name":"Palle Duun Rohde","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rohde, Palle Duun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127971036","display_name":"Morten Steen Kvistholm Jensen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jensen, Morten Hasselstr\u00f8m","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5114637495","display_name":"Simon Lebech Cichosz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cichosz, Simon Lebech","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.260699987411499,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.260699987411499,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.2152000069618225,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.1535000056028366,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/brier-score","display_name":"Brier score","score":0.8664000034332275},{"id":"https://openalex.org/keywords/resampling","display_name":"Resampling","score":0.8525000214576721},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.6521000266075134},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5936999917030334},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.5221999883651733},{"id":"https://openalex.org/keywords/receiver-operating-characteristic","display_name":"Receiver operating characteristic","score":0.5101000070571899},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.47269999980926514}],"concepts":[{"id":"https://openalex.org/C35405484","wikidata":"https://www.wikidata.org/wiki/Q4967066","display_name":"Brier score","level":2,"score":0.8664000034332275},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.8525000214576721},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.6521000266075134},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5936999917030334},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5390999913215637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5306000113487244},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.5221999883651733},{"id":"https://openalex.org/C58471807","wikidata":"https://www.wikidata.org/wiki/Q327120","display_name":"Receiver operating characteristic","level":2,"score":0.5101000070571899},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.47269999980926514},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44440001249313354},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.44279998540878296},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.4124999940395355},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3711000084877014},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.3684999942779541},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.3402999937534332},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.32850000262260437},{"id":"https://openalex.org/C63002673","wikidata":"https://www.wikidata.org/wiki/Q2260590","display_name":"Scoring rule","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.2962000072002411},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26930001378059387},{"id":"https://openalex.org/C12174686","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk assessment","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2619999945163727}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:pure.atira.dk:openaire/b4929c91-b7bc-476c-b1ff-a7570623bc56","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2603.00208","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Andersen, A K, Mehdizavareh, M H, Khan, A, Becher, T, Britsch, S, Britsch, M, B\u00f6ttcher, M, Winther, S, Rohde, P D, Jensen, M H & Cichosz, S L 2026 'Tipping the Balance : Impact of Class Imbalance Correction on the Performance of Clinical Risk Prediction Models' arXiv. https://doi.org/10.48550/arXiv.2603.00208","raw_type":"workingPaper"},{"id":"pmh:oai:pure.atira.dk:publications/b4929c91-b7bc-476c-b1ff-a7570623bc56","is_oa":true,"landing_page_url":"https://vbn.aau.dk/da/publications/b4929c91-b7bc-476c-b1ff-a7570623bc56","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Andersen, A K, Mehdizavareh, M H, Khan, A, Becher, T, Britsch, S, Britsch, M, B\u00f6ttcher, M, Winther, S, Rohde, P D, Jensen, M H & Cichosz, S L 2026 'Tipping the Balance : Impact of Class Imbalance Correction on the Performance of Clinical Risk Prediction Models' arXiv. https://doi.org/10.48550/arXiv.2603.00208","raw_type":"workingPaper"},{"id":"doi:10.48550/arxiv.2603.00208","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00208","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire/b4929c91-b7bc-476c-b1ff-a7570623bc56","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2603.00208","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Andersen, A K, Mehdizavareh, M H, Khan, A, Becher, T, Britsch, S, Britsch, M, B\u00f6ttcher, M, Winther, S, Rohde, P D, Jensen, M H & Cichosz, S L 2026 'Tipping the Balance : Impact of Class Imbalance Correction on the Performance of Clinical Risk Prediction Models' arXiv. https://doi.org/10.48550/arXiv.2603.00208","raw_type":"workingPaper"},"sustainable_development_goals":[{"score":0.6663110852241516,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Objective:":[0],"ML-based":[1],"clinical":[2,55,60,220],"risk":[3,208],"prediction":[4,56,221],"models":[5,78,142],"are":[6,18],"increasingly":[7],"used":[8,45,96,224],"to":[9,21,141,188],"support":[10],"decision-making":[11],"in":[12,25,131,172,198,233],"healthcare.":[13],"While":[14],"class-imbalance":[15,98,225],"correction":[16,99,182,226],"techniques":[17,227],"commonly":[19,95,223],"applied":[20],"improve":[22],"model":[23,74,120],"performance":[24],"settings":[26],"with":[27,161,238],"rare":[28],"outcomes,":[29],"their":[30],"impact":[31,126],"on":[32,48,88,107,127,144],"probabilistic":[33,193],"calibration":[34,52,113,176,199],"remains":[35],"insufficiently":[36],"understood.":[37],"This":[38],"study":[39],"evaluated":[40],"the":[41,89,132,145,175],"effect":[42],"of":[43,206,218],"widely":[44],"resampling":[46,122,163,171],"strategies":[47,100],"both":[49],"discrimination":[50,111,234],"and":[51,66,79,92,112,119,150,195,201,235],"across":[53],"real-world":[54,219],"tasks.":[57],"Methods:":[58],"Ten":[59],"datasets":[61,118],"spanning":[62],"diverse":[63,216],"medical":[64],"domains":[65],"including":[67,76],"605,842":[68],"patients":[69],"were":[70,83,86,148,236],"analyzed.":[71],"Multiple":[72],"machine-learning":[73],"families,":[75,121],"linear":[77],"several":[80],"non-linear":[81],"approaches,":[82],"evaluated.":[84],"Models":[85,178],"trained":[87,143,179],"original":[90,146],"data":[91,109,147],"under":[93],"three":[94],"1:1":[97],"(SMOTE,":[101],"RUS,":[102],"ROS).":[103],"Performance":[104],"was":[105],"assessed":[106],"held-out":[108],"using":[110,180],"metrics.":[114],"Results:":[115],"Across":[116],"all":[117],"had":[123],"no":[124,162],"positive":[125],"predictive":[128],"performance.":[129,177,212],"Changes":[130],"Receiver":[133],"Operating":[134],"Characteristic":[135],"Area":[136],"Under":[137],"Curve":[138],"(ROC-AUC)":[139],"relative":[140],"small":[149],"inconsistent":[151],"(ROS:":[152],"-0.002,":[153],"p&lt;0.05;":[154],"RUS:":[155],"-0.004,":[156],"p&gt;0.05;":[157],"SMOTE:":[158],"-0.01,":[159],"p&lt;0.05),":[160,190],"strategy":[164],"demonstrating":[165],"a":[166,215],"systematic":[167,204],"improvement.":[168],"In":[169,214],"contrast,":[170],"general":[173],"degraded":[174,239],"imbalance":[181],"exhibited":[183],"higher":[184],"Brier":[185],"scores":[186],"(0.029":[187],"0.080,":[189],"reflecting":[191],"poorer":[192],"accuracy,":[194],"marked":[196],"deviations":[197],"intercept":[200],"slope,":[202],"indicating":[203],"distortions":[205],"predicted":[207],"despite":[209],"preserved":[210],"rank-based":[211],"Conclusion:":[213],"set":[217],"tasks,":[222],"did":[228],"not":[229],"provide":[230],"generalizable":[231],"improvements":[232],"associated":[237],"calibration.":[240]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-04T00:00:00"}
