{"id":"https://openalex.org/W4401209986","doi":"https://doi.org/10.1007/s10994-024-06584-1","title":"Autoreplicative random forests with applications to missing value imputation","display_name":"Autoreplicative random forests with applications to missing value imputation","publication_year":2024,"publication_date":"2024-08-01","ids":{"openalex":"https://openalex.org/W4401209986","doi":"https://doi.org/10.1007/s10994-024-06584-1"},"language":"en","primary_location":{"id":"doi:10.1007/s10994-024-06584-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06584-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06584-1.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06584-1.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102413090","display_name":"Ekaterina Antonenko","orcid":null},"institutions":[{"id":"https://openalex.org/I142476485","display_name":"\u00c9cole Polytechnique","ror":"https://ror.org/05hy3tk52","country_code":"FR","type":"education","lineage":["https://openalex.org/I142476485","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I154526488","display_name":"Inserm","ror":"https://ror.org/02vjkv261","country_code":"FR","type":"government","lineage":["https://openalex.org/I154526488"]},{"id":"https://openalex.org/I2746051580","display_name":"Universit\u00e9 Paris Sciences et Lettres","ror":"https://ror.org/013cjyk83","country_code":"FR","type":"education","lineage":["https://openalex.org/I2746051580"]},{"id":"https://openalex.org/I4210139461","display_name":"Laboratoire d'Informatique de l'\u00c9cole Polytechnique","ror":"https://ror.org/04afed728","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I142476485","https://openalex.org/I4210139461","https://openalex.org/I4210145102","https://openalex.org/I4210159245"]},{"id":"https://openalex.org/I80043","display_name":"Institut Curie","ror":"https://ror.org/04t0gwh46","country_code":"FR","type":"nonprofit","lineage":["https://openalex.org/I80043"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Ekaterina Antonenko","raw_affiliation_strings":["INSERM, U900, 75005, Paris, France","Institut Curie, PSL Research University, 75005, Paris, France","LIX, Ecole Polytechnique, IP Paris, 91120, Palaiseau, France","Mines Paris, CBIO-Centre for Computational Biology, PSL Research University, 75006, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INSERM, U900, 75005, Paris, France","institution_ids":["https://openalex.org/I154526488"]},{"raw_affiliation_string":"Institut Curie, PSL Research University, 75005, Paris, France","institution_ids":["https://openalex.org/I2746051580","https://openalex.org/I80043"]},{"raw_affiliation_string":"LIX, Ecole Polytechnique, IP Paris, 91120, Palaiseau, France","institution_ids":["https://openalex.org/I4210139461","https://openalex.org/I142476485"]},{"raw_affiliation_string":"Mines Paris, CBIO-Centre for Computational Biology, PSL Research University, 75006, Paris, France","institution_ids":["https://openalex.org/I2746051580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026274833","display_name":"Ander Carre\u00f1o","orcid":"https://orcid.org/0000-0002-1552-171X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ander Carre\u00f1o","raw_affiliation_strings":["Quant AI Lab, 28043, Madrid, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Quant AI Lab, 28043, Madrid, Spain","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055668668","display_name":"Jesse Read","orcid":"https://orcid.org/0000-0002-1013-6724"},"institutions":[{"id":"https://openalex.org/I142476485","display_name":"\u00c9cole Polytechnique","ror":"https://ror.org/05hy3tk52","country_code":"FR","type":"education","lineage":["https://openalex.org/I142476485","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210139461","display_name":"Laboratoire d'Informatique de l'\u00c9cole Polytechnique","ror":"https://ror.org/04afed728","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I142476485","https://openalex.org/I4210139461","https://openalex.org/I4210145102","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jesse Read","raw_affiliation_strings":["LIX, Ecole Polytechnique, IP Paris, 91120, Palaiseau, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LIX, Ecole Polytechnique, IP Paris, 91120, Palaiseau, France","institution_ids":["https://openalex.org/I4210139461","https://openalex.org/I142476485"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102413090"],"corresponding_institution_ids":["https://openalex.org/I142476485","https://openalex.org/I154526488","https://openalex.org/I2746051580","https://openalex.org/I4210139461","https://openalex.org/I80043"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.972,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.79508627,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"113","issue":"10","first_page":"7617","last_page":"7643"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9833999872207642,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.983299970626831,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.8685398101806641},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.8464477062225342},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7147976160049438},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.6152901649475098},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6131358742713928},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5533617734909058},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5001976490020752},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.46431753039360046},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4631248414516449}],"concepts":[{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.8685398101806641},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.8464477062225342},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7147976160049438},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.6152901649475098},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6131358742713928},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5533617734909058},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5001976490020752},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.46431753039360046},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4631248414516449}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s10994-024-06584-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06584-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06584-1.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-05000324v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05000324","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning, 2024, 113 (10), pp.7617-7643. &#x27E8;10.1007/s10994-024-06584-1&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":{"id":"doi:10.1007/s10994-024-06584-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06584-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06584-1.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4401209986.pdf","grobid_xml":"https://content.openalex.org/works/W4401209986.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W1678889691","https://openalex.org/W1953606363","https://openalex.org/W1999954155","https://openalex.org/W2000769684","https://openalex.org/W2025768430","https://openalex.org/W2032997274","https://openalex.org/W2049633694","https://openalex.org/W2052684427","https://openalex.org/W2064186732","https://openalex.org/W2096863518","https://openalex.org/W2115098571","https://openalex.org/W2146241755","https://openalex.org/W2153491803","https://openalex.org/W2165363188","https://openalex.org/W2286147163","https://openalex.org/W2404281525","https://openalex.org/W2807827562","https://openalex.org/W2897574832","https://openalex.org/W2908849044","https://openalex.org/W2956663245","https://openalex.org/W3096627802","https://openalex.org/W3197494818","https://openalex.org/W3212610181","https://openalex.org/W4212774754","https://openalex.org/W4287509530","https://openalex.org/W4367397006","https://openalex.org/W6675354045","https://openalex.org/W6848653560","https://openalex.org/W6887894044"],"related_works":["https://openalex.org/W2181530120","https://openalex.org/W4211215373","https://openalex.org/W2024529227","https://openalex.org/W2055961818","https://openalex.org/W1574575415","https://openalex.org/W3144172081","https://openalex.org/W3179858851","https://openalex.org/W3028371478","https://openalex.org/W2081476516","https://openalex.org/W2581984549"],"abstract_inverted_index":{"Missing":[0],"values":[1,16,152],"are":[2,35,153],"a":[3,18,36,80,91,165,168],"common":[4],"problem":[5],"in":[6,41,87,167],"data":[7,27],"science":[8],"and":[9,107,116,134],"machine":[10],"learning.":[11],"Removing":[12],"instances":[13],"with":[14],"missing":[15,46,140],"is":[17,113],"straightforward":[19],"workaround,":[20],"but":[21],"this":[22,71],"can":[23],"significantly":[24],"hinder":[25],"subsequent":[26],"analysis,":[28],"particularly":[29],"when":[30],"features":[31],"outnumber":[32],"instances.":[33],"There":[34],"variety":[37],"of":[38,90,163],"methodologies":[39],"proposed":[40,139],"the":[42,88,138,150,161],"literature":[43],"for":[44,50,56],"imputing":[45],"values.":[47],"Denoising":[48],"Autoencoders,":[49],"example,":[51],"have":[52,62],"been":[53,63],"leveraged":[54],"efficiently":[55],"imputation.":[57],"However,":[58],"neural":[59,125],"network":[60,126],"approaches":[61],"relatively":[64],"less":[65],"effective":[66],"on":[67,104],"smaller":[68],"datasets.":[69],"In":[70,128],"work,":[72],"we":[73,85,144],"propose":[74,146],"Autoreplicative":[75],"Random":[76],"Forests":[77],"(ARF)":[78],"as":[79],"multi-output":[81],"learning":[82],"approach,":[83],"which":[84],"introduce":[86],"context":[89],"framework":[92,166],"that":[93,111],"may":[94],"impute":[95],"via":[96],"either":[97],"an":[98],"iterative":[99],"or":[100],"procedural":[101],"process.":[102],"Experiments":[103],"several":[105],"low-":[106],"high-dimensional":[108],"datasets":[109],"show":[110],"ARF":[112],"computationally":[114],"efficient":[115],"exhibits":[117],"better":[118],"imputation":[119,142,157],"performance":[120],"than":[121],"its":[122],"competitors,":[123],"including":[124],"approaches.":[127],"order":[129],"to":[130,137],"provide":[131],"statistical":[132],"analysis":[133],"mathematical":[135],"background":[136],"value":[141],"framework,":[143],"also":[145],"probabilistic":[147],"ARFs,":[148],"where":[149],"confidence":[151],"provided":[154],"over":[155],"different":[156],"hypotheses,":[158],"therefore":[159],"maximizing":[160],"utility":[162],"such":[164],"machine-learning":[169],"pipeline":[170],"targeting":[171],"predictive":[172],"performance.":[173]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
