{"id":"https://openalex.org/W7102414427","doi":"https://doi.org/10.48550/arxiv.2510.23624","title":"DiNo and RanBu: Lightweight Predictions from Shallow Random Forests","display_name":"DiNo and RanBu: Lightweight Predictions from Shallow Random Forests","publication_year":2025,"publication_date":"2025-10-23","ids":{"openalex":"https://openalex.org/W7102414427","doi":"https://doi.org/10.48550/arxiv.2510.23624"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2510.23624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.23624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2510.23624","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Santos, Tiago Mendon\u00e7a dos","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Santos, Tiago Mendon\u00e7a dos","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Izbicki, Rafael","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Izbicki, Rafael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Esteves, Lu\u00eds Gustavo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Esteves, Lu\u00eds Gustavo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5554999709129333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5554999709129333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.04989999905228615,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.035999998450279236,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.628000020980835},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6169999837875366},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.46480000019073486},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.45840001106262207},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.4334999918937683},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.43070000410079956},{"id":"https://openalex.org/keywords/quantile","display_name":"Quantile","score":0.38109999895095825},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.38029998540878296}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6783999800682068},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.628000020980835},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6169999837875366},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46480000019073486},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.45840001106262207},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.4334999918937683},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.43070000410079956},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3824999928474426},{"id":"https://openalex.org/C118671147","wikidata":"https://www.wikidata.org/wiki/Q578714","display_name":"Quantile","level":2,"score":0.38109999895095825},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.38029998540878296},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.373199999332428},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34850001335144043},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32089999318122864},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3142000138759613},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.31360000371932983},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C89128539","wikidata":"https://www.wikidata.org/wiki/Q1949963","display_name":"Statistic","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.2606000006198883},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2510.23624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.23624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2510.23624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.23624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Life in Land","score":0.5369758009910583,"id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Random":[0],"Forest":[1],"ensembles":[2],"are":[3,93],"a":[4,50,148],"strong":[5],"baseline":[6],"for":[7,189],"tabular":[8,180],"prediction":[9],"tasks,":[10],"but":[11],"their":[12],"reliance":[13],"on":[14,178],"hundreds":[15],"of":[16,53,70,97,122],"deep":[17],"trees":[18,55,92],"often":[19],"results":[20],"in":[21,30,126,144],"high":[22],"inference":[23,132],"latency":[24],"and":[25,41,95,112],"memory":[26],"demands,":[27],"limiting":[28],"deployment":[29],"latency-sensitive":[31],"or":[32,118],"resource-constrained":[33],"environments.":[34],"We":[35,176],"introduce":[36],"DiNo":[37,60,138],"(Distance":[38],"with":[39,161],"Nodes)":[40],"RanBu":[42,74,116],"(Random":[43],"Bushes),":[44],"two":[45],"shallow-forest":[46],"methods":[47,153],"that":[48],"convert":[49],"small":[51],"set":[52],"depth-limited":[54],"into":[56],"efficient,":[57],"distance-weighted":[58],"predictors.":[59],"measures":[61],"cophenetic":[62],"distances":[63],"via":[64],"the":[65,98,120,140],"most":[66],"recent":[67],"common":[68],"ancestor":[69],"observation":[71],"pairs,":[72],"while":[73],"applies":[75],"kernel":[76],"smoothing":[77],"to":[78,136,156,186],"Breiman's":[79],"classical":[80],"proximity":[81],"measure.":[82],"Both":[83,152],"approaches":[84],"operate":[85],"entirely":[86],"after":[87],"forest":[88],"training:":[89],"no":[90],"additional":[91],"grown,":[94],"tuning":[96],"single":[99],"bandwidth":[100],"parameter":[101],"$h$":[102],"requires":[103],"only":[104],"lightweight":[105],"matrix-vector":[106],"operations.":[107],"Across":[108],"three":[109],"synthetic":[110],"benchmarks":[111],"25":[113],"public":[114],"datasets,":[115],"matches":[117],"exceeds":[119],"accuracy":[121,160],"full-depth":[123],"random":[124,181],"forests-particularly":[125],"high-noise":[127],"settings-while":[128],"reducing":[129],"training":[130],"plus":[131],"time":[133],"by":[134],"up":[135],"95\\%.":[137],"achieves":[139],"best":[141],"bias-variance":[142],"trade-off":[143],"low-noise":[145],"regimes":[146],"at":[147,174],"modest":[149],"computational":[150],"cost.":[151],"extend":[154],"directly":[155],"quantile":[157],"regression,":[158],"maintaining":[159],"substantial":[162],"speed":[163],"gains.":[164],"The":[165],"implementation":[166],"is":[167],"available":[168],"as":[169],"an":[170],"open-source":[171],"R/C++":[172],"package":[173],"https://github.com/tiagomendonca/dirf.":[175],"focus":[177],"structured":[179],"samples":[182],"(i.i.d.),":[183],"leaving":[184],"extensions":[185],"other":[187],"modalities":[188],"future":[190],"work.":[191]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-30T00:00:00"}
