{"id":"https://openalex.org/W7123672893","doi":"https://doi.org/10.48550/arxiv.2601.07003","title":"Unity Forests: Improving Interaction Modelling and Interpretability in Random Forests","display_name":"Unity Forests: Improving Interaction Modelling and Interpretability in Random Forests","publication_year":2026,"publication_date":"2026-01-11","ids":{"openalex":"https://openalex.org/W7123672893","doi":"https://doi.org/10.48550/arxiv.2601.07003"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.07003","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.07003","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.07003","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048970390","display_name":"Roman Hornung","orcid":"https://orcid.org/0000-0002-6036-1495"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]},{"id":"https://openalex.org/I169724904","display_name":"Zimmer Biomet (Netherlands)","ror":"https://ror.org/034k8cv93","country_code":"NL","type":"company","lineage":["https://openalex.org/I169724904","https://openalex.org/I4210115238"]},{"id":"https://openalex.org/I4403386549","display_name":"Munich Center for Machine Learning","ror":"https://ror.org/02nfy3535","country_code":null,"type":"education","lineage":["https://openalex.org/I4403386549","https://openalex.org/I62916508","https://openalex.org/I8204097"]}],"countries":["DE","NL"],"is_corresponding":true,"raw_author_name":"Hornung, Roman","raw_affiliation_strings":["Institute for Medical Information Processing, Biometry and Epidemiology, Faculty of Medicine, Ludwig Maximilian University of Munich","Munich Center for Machine Learning"],"affiliations":[{"raw_affiliation_string":"Institute for Medical Information Processing, Biometry and Epidemiology, Faculty of Medicine, Ludwig Maximilian University of Munich","institution_ids":["https://openalex.org/I169724904","https://openalex.org/I8204097"]},{"raw_affiliation_string":"Munich Center for Machine Learning","institution_ids":["https://openalex.org/I4403386549"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042014267","display_name":"Alexander Hapfelmeier","orcid":"https://orcid.org/0000-0001-6765-6352"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Hapfelmeier, Alexander","raw_affiliation_strings":["Institute of General Practice and Health Services Research, Department Clinical Medicine, TUM School of Medicine and Health, Technical University of Munich","Institute of AI and Informatics in Medicine, TUM School of Medicine and Health, Technical University of Munich"],"affiliations":[{"raw_affiliation_string":"Institute of General Practice and Health Services Research, Department Clinical Medicine, TUM School of Medicine and Health, Technical University of Munich","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Institute of AI and Informatics in Medicine, TUM School of Medicine and Health, Technical University of Munich","institution_ids":["https://openalex.org/I62916508"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5048970390"],"corresponding_institution_ids":["https://openalex.org/I8204097","https://openalex.org/I169724904","https://openalex.org/I4403386549"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12417","display_name":"Morphological variations and asymmetry","score":0.14249999821186066,"subfield":{"id":"https://openalex.org/subfields/2608","display_name":"Geometry and Topology"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12417","display_name":"Morphological variations and asymmetry","score":0.14249999821186066,"subfield":{"id":"https://openalex.org/subfields/2608","display_name":"Geometry and Topology"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.08449999988079071,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.07999999821186066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/covariate","display_name":"Covariate","score":0.9427000284194946},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.7925999760627747},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7314000129699707},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.60589998960495},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.6021999716758728},{"id":"https://openalex.org/keywords/recursive-partitioning","display_name":"Recursive partitioning","score":0.4675000011920929},{"id":"https://openalex.org/keywords/variable","display_name":"Variable (mathematics)","score":0.43810001015663147},{"id":"https://openalex.org/keywords/remainder","display_name":"Remainder","score":0.3646000027656555}],"concepts":[{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.9427000284194946},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.7925999760627747},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7314000129699707},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6212000250816345},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.60589998960495},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.6021999716758728},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.5482000112533569},{"id":"https://openalex.org/C137345334","wikidata":"https://www.wikidata.org/wiki/Q7303350","display_name":"Recursive partitioning","level":2,"score":0.4675000011920929},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.43810001015663147},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3675000071525574},{"id":"https://openalex.org/C39613435","wikidata":"https://www.wikidata.org/wiki/Q846677","display_name":"Remainder","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.3531999886035919},{"id":"https://openalex.org/C197656967","wikidata":"https://www.wikidata.org/wiki/Q17058458","display_name":"Marginal model","level":3,"score":0.3361000120639801},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.33219999074935913},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.32409998774528503},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3188999891281128},{"id":"https://openalex.org/C165216359","wikidata":"https://www.wikidata.org/wiki/Q670653","display_name":"Marginal distribution","level":3,"score":0.3093000054359436},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.28529998660087585},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28349998593330383},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27889999747276306},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26919999718666077},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2639999985694885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.07003","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.07003","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.07003","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.07003","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7154006958007812,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Random":[0],"forests":[1,50],"(RFs)":[2],"are":[3,13,29,33,74,131,142],"widely":[4],"used":[5],"for":[6],"prediction":[7],"and":[8,12,171,218,239],"variable":[9,100],"importance":[10,101],"analysis":[11],"often":[14],"believed":[15],"to":[16,56,82],"capture":[17],"any":[18],"types":[19,234],"of":[20,71,121],"interactions":[21,32,59],"via":[22],"recursive":[23],"splitting.":[24],"However,":[25],"since":[26],"the":[27,67,90,98,113,126,155,176,195,230],"splits":[28,70,124],"chosen":[30],"locally,":[31],"only":[34,117,144],"reliably":[35,198,235],"captured":[36],"when":[37],"at":[38],"least":[39],"one":[40],"involved":[41],"covariate":[42,80,151,170,186],"has":[43,187],"a":[44,78,84,118,146,192,210,244],"marginal":[45,63,179,203],"effect.":[46],"We":[47,95],"introduce":[48,159],"unity":[49,99,196],"(UFOs),":[51],"an":[52,149],"RF":[53],"variant":[54],"designed":[55],"better":[57],"exploit":[58],"involving":[60],"covariates":[61,137,201],"without":[62,202],"effects.":[64,190],"In":[65,191,209],"UFOs,":[66],"first":[68],"few":[69],"each":[72,185],"tree":[73,114,122,161,167],"optimized":[75],"jointly":[76],"across":[77],"random":[79],"subset":[81],"form":[83],"\"tree":[85],"root\"":[86],"capturing":[87],"such":[88],"interactions;":[89],"remainder":[91],"is":[92,105],"grown":[93],"conventionally.":[94],"further":[96],"propose":[97],"measure":[102],"(VIM),":[103],"which":[104,164,184],"based":[106],"on":[107],"out-of-bag":[108],"split":[109,147],"criterion":[110,129],"values":[111,130],"from":[112],"roots.":[115],"Here,":[116],"small":[119],"fraction":[120],"root":[123],"with":[125,138,224],"highest":[127],"in-bag":[128],"considered":[132],"per":[133,169],"covariate,":[134],"reflecting":[135],"that":[136],"purely":[139],"interaction-based":[140],"effects":[141],"discriminative":[143],"if":[145],"in":[148,154,236,243],"interacting":[150,200],"occurred":[152],"earlier":[153],"tree.":[156],"Finally,":[157],"we":[158],"covariate-representative":[160],"roots":[162,168],"(CRTRs),":[163],"select":[165],"representative":[166],"provide":[172],"interpretable":[173],"insight":[174],"into":[175],"conditions":[177],"-":[178,182],"or":[180],"interactive":[181],"under":[183],"its":[188],"strongest":[189],"simulation":[193],"study,":[194],"VIM":[197],"identified":[199],"effects,":[204],"unlike":[205],"conventional":[206],"RF-based":[207],"VIMs.":[208],"large-scale":[211],"real-data":[212],"comparison,":[213],"UFOs":[214],"achieved":[215],"higher":[216],"discrimination":[217],"predictive":[219],"accuracy":[220],"than":[221],"standard":[222],"RFs,":[223],"comparable":[225],"calibration.":[226],"The":[227],"CRTRs":[228],"reproduced":[229],"covariates'":[231],"true":[232],"effect":[233],"simulated":[237],"data":[238,246],"provided":[240],"interesting":[241],"insights":[242],"real":[245],"analysis.":[247]},"counts_by_year":[],"updated_date":"2026-01-14T23:44:37.837170","created_date":"2026-01-14T00:00:00"}
