{"id":"https://openalex.org/W7117531138","doi":"https://doi.org/10.48550/arxiv.2512.21602","title":"An Empirical Study of Machine Learning Robustness and Scalability for Imbalanced Tabular Clinical Data in Emergency and Critical Care","display_name":"An Empirical Study of Machine Learning Robustness and Scalability for Imbalanced Tabular Clinical Data in Emergency and Critical Care","publication_year":2025,"publication_date":"2025-12-25","ids":{"openalex":"https://openalex.org/W7117531138","doi":"https://doi.org/10.48550/arxiv.2512.21602"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.21602","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.21602","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.21602","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068589144","display_name":"Yusuf Brima","orcid":"https://orcid.org/0000-0002-9975-8676"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brima, Yusuf","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5090363326","display_name":"Marcellin Atemkeng","orcid":"https://orcid.org/0000-0002-9020-3885"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Atemkeng, Marcellin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.5002999901771545,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.5002999901771545,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.2379000037908554,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.05299999937415123,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7889000177383423},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7709000110626221},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.5054000020027161},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.4699999988079071},{"id":"https://openalex.org/keywords/ensemble-forecasting","display_name":"Ensemble forecasting","score":0.4505999982357025},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.38420000672340393},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.3643999993801117}],"concepts":[{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7978000044822693},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7889000177383423},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7709000110626221},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7278000116348267},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6699000000953674},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.4699999988079071},{"id":"https://openalex.org/C119898033","wikidata":"https://www.wikidata.org/wiki/Q3433888","display_name":"Ensemble forecasting","level":2,"score":0.4505999982357025},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.38420000672340393},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.3643999993801117},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3353999853134155},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.3285999894142151},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.32760000228881836},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3176000118255615},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C122342681","wikidata":"https://www.wikidata.org/wiki/Q330828","display_name":"Skewness","level":2,"score":0.25859999656677246},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2563999891281128}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.21602","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.21602","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.21602","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.21602","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Every":[0],"year,":[1],"millions":[2],"of":[3,29],"patients":[4],"pass":[5],"through":[6],"emergency":[7],"departments":[8],"and":[9,22,32,48,54,79,89,123,139,180],"intensive":[10],"care":[11],"units,":[12],"where":[13],"clinicians":[14],"must":[15],"make":[16],"high-stakes":[17],"decisions":[18],"under":[19,177],"time":[20],"pressure":[21],"uncertainty.":[23],"Machine":[24],"learning":[25],"could":[26],"support":[27],"prediction":[28,129],"deterioration,":[30],"triage,":[31],"rare":[33],"critical":[34],"outcomes,":[35],"but":[36],"clinical":[37,59,128,216,241],"data":[38,61,75],"are":[39,222],"often":[40],"severely":[41],"imbalanced,":[42],"biasing":[43],"models":[44,56,93,102,165,199,221],"toward":[45],"majority":[46],"classes":[47],"reducing":[49],"predictive":[50],"performance.":[51,168],"Developing":[52],"robust":[53],"efficient":[55],"for":[57],"imbalanced":[58,73],"tabular":[60,74,219],"therefore":[62],"remains":[63],"an":[64],"important":[65],"challenge.":[66],"We":[67],"evaluated":[68,104],"six":[69],"model":[70,211],"families":[71],"on":[72],"from":[76],"the":[77,142,174,181,224],"MIMIC-IV-ED":[78],"eICU":[80],"databases:":[81],"Decision":[82],"Tree,":[83],"Random":[84],"Forest,":[85],"XGBoost,":[86],"TabNet,":[87],"TabICL,":[88],"TabPFN":[90,137],"v2.6.":[91],"Trainable":[92],"were":[94,103,114],"optimized":[95],"using":[96,116],"Bayesian":[97],"hyperparameter":[98],"tuning,":[99],"while":[100,163,197,231],"foundation":[101,164,198,220],"in":[105],"their":[106],"pretrained":[107],"inference":[108],"regime":[109],"without":[110],"task-specific":[111],"reweighting.":[112],"Models":[113],"assessed":[115],"Macro":[117,145],"F1-score,":[118],"robustness":[119],"to":[120],"increasing":[121,178],"imbalance,":[122],"computational":[124,183],"scalability":[125],"across":[126,133,214],"seven":[127],"tasks.":[130],"Results":[131],"differed":[132],"datasets.":[134],"On":[135,152],"MIMIC-IV-ED,":[136],"v2.6":[138],"TabICL":[140],"achieved":[141,166],"strongest":[143],"average":[144],"F1":[146],"ranks,":[147],"with":[148,194,227],"XGBoost":[149,154],"remaining":[150],"competitive.":[151],"eICU,":[153],"consistently":[155],"performed":[156],"best,":[157],"followed":[158],"by":[159],"other":[160],"tree-based":[161,189],"methods,":[162],"intermediate":[167],"Across":[169],"both":[170],"datasets,":[171],"TabNet":[172],"showed":[173,187],"largest":[175],"degradation":[176],"imbalance":[179],"highest":[182],"cost.":[184,204],"Training-time":[185],"analysis":[186],"that":[188,208,237],"methods":[190],"scaled":[191],"most":[192],"favorably":[193],"dataset":[195],"size,":[196],"offered":[200],"low":[201],"per-task":[202],"adaptation":[203],"These":[205],"findings":[206],"suggest":[207],"no":[209],"single":[210],"family":[212],"dominates":[213],"all":[215],"settings.":[217],"However,":[218],"narrowing":[223],"performance":[225],"gap":[226],"strong":[228],"classical":[229],"baselines":[230],"offering":[232],"a":[233],"distinct":[234],"efficiency-performance":[235],"trade-off":[236],"may":[238],"benefit":[239],"resource-constrained":[240],"environments.":[242]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2025-12-30T00:00:00"}
