{"id":"https://openalex.org/W4388307524","doi":"https://doi.org/10.5334/dsj-2023-042","title":"A Notion of Feature Importance by Decorrelation and Detection of Trends by Random Forest Regression","display_name":"A Notion of Feature Importance by Decorrelation and Detection of Trends by Random Forest Regression","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4388307524","doi":"https://doi.org/10.5334/dsj-2023-042"},"language":"en","primary_location":{"id":"doi:10.5334/dsj-2023-042","is_oa":true,"landing_page_url":"https://doi.org/10.5334/dsj-2023-042","pdf_url":"https://storage.googleapis.com/jnl-up-j-dsj-files/journals/1/articles/1585/6544c599b267b.pdf","source":{"id":"https://openalex.org/S62969111","display_name":"Data Science Journal","issn_l":"1683-1470","issn":["1683-1470"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320511","host_organization_name":"Ubiquity Press","host_organization_lineage":["https://openalex.org/P4310320511"],"host_organization_lineage_names":["Ubiquity Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://storage.googleapis.com/jnl-up-j-dsj-files/journals/1/articles/1585/6544c599b267b.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084852770","display_name":"Yannick Gerstorfer","orcid":null},"institutions":[{"id":"https://openalex.org/I2801628138","display_name":"Frankfurt Institute for Advanced Studies","ror":"https://ror.org/05vmv8m79","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2801628138"]},{"id":"https://openalex.org/I114090438","display_name":"Goethe University Frankfurt","ror":"https://ror.org/04cvxnb49","country_code":"DE","type":"education","lineage":["https://openalex.org/I114090438"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Yannick Gerstorfer","raw_affiliation_strings":["Frankfurt Institute for Advanced Studies, Goethe University Frankfurt Frankfurt 60325"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Frankfurt Institute for Advanced Studies, Goethe University Frankfurt Frankfurt 60325","institution_ids":["https://openalex.org/I2801628138","https://openalex.org/I114090438"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082557348","display_name":"Max Hahn\u2010Klimroth","orcid":"https://orcid.org/0000-0002-3995-419X"},"institutions":[{"id":"https://openalex.org/I200332995","display_name":"TU Dortmund University","ror":"https://ror.org/01k97gp34","country_code":"DE","type":"education","lineage":["https://openalex.org/I200332995"]},{"id":"https://openalex.org/I114090438","display_name":"Goethe University Frankfurt","ror":"https://ror.org/04cvxnb49","country_code":"DE","type":"education","lineage":["https://openalex.org/I114090438"]},{"id":"https://openalex.org/I2801628138","display_name":"Frankfurt Institute for Advanced Studies","ror":"https://ror.org/05vmv8m79","country_code":"DE","type":"facility","lineage":["https://openalex.org/I2801628138"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Max Hahn-Klimroth","raw_affiliation_strings":["Frankfurt Institute for Advanced Studies, Goethe University Frankfurt Frankfurt 60325, Germany","Faculty of Computer Sciences, TU Dortmund University Dortmund 44227, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Frankfurt Institute for Advanced Studies, Goethe University Frankfurt Frankfurt 60325, Germany","institution_ids":["https://openalex.org/I2801628138","https://openalex.org/I114090438"]},{"raw_affiliation_string":"Faculty of Computer Sciences, TU Dortmund University Dortmund 44227, Germany","institution_ids":["https://openalex.org/I200332995"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029050486","display_name":"Lena Krieg","orcid":"https://orcid.org/0000-0002-5302-6955"},"institutions":[{"id":"https://openalex.org/I200332995","display_name":"TU Dortmund University","ror":"https://ror.org/01k97gp34","country_code":"DE","type":"education","lineage":["https://openalex.org/I200332995"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Lena Krieg","raw_affiliation_strings":["Faculty of Computer Sciences, TU Dortmund University Dortmund 44227"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Computer Sciences, TU Dortmund University Dortmund 44227","institution_ids":["https://openalex.org/I200332995"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5029050486","https://openalex.org/A5084852770"],"corresponding_institution_ids":["https://openalex.org/I114090438","https://openalex.org/I200332995","https://openalex.org/I2801628138"],"apc_list":{"value":350,"currency":"GBP","value_usd":429},"apc_paid":{"value":887,"currency":"EUR","value_usd":956},"fwci":2.0221,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.89495486,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"22","issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9751999974250793,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9751999974250793,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9725000262260437,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.7751847505569458},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.761702299118042},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.6789862513542175},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6187808513641357},{"id":"https://openalex.org/keywords/tree-traversal","display_name":"Tree traversal","score":0.5610292553901672},{"id":"https://openalex.org/keywords/decorrelation","display_name":"Decorrelation","score":0.5436933636665344},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.5127914547920227},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49259740114212036},{"id":"https://openalex.org/keywords/variable","display_name":"Variable (mathematics)","score":0.49127858877182007},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.4819778800010681},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.4819345474243164},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44931501150131226},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.4414517283439636},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.356474906206131},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3170771598815918},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2978786826133728},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.12018850445747375}],"concepts":[{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.7751847505569458},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.761702299118042},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.6789862513542175},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6187808513641357},{"id":"https://openalex.org/C140745168","wikidata":"https://www.wikidata.org/wiki/Q1210082","display_name":"Tree traversal","level":2,"score":0.5610292553901672},{"id":"https://openalex.org/C177860922","wikidata":"https://www.wikidata.org/wiki/Q788608","display_name":"Decorrelation","level":2,"score":0.5436933636665344},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.5127914547920227},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49259740114212036},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.49127858877182007},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.4819778800010681},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.4819345474243164},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44931501150131226},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.4414517283439636},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.356474906206131},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3170771598815918},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2978786826133728},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12018850445747375},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5334/dsj-2023-042","is_oa":true,"landing_page_url":"https://doi.org/10.5334/dsj-2023-042","pdf_url":"https://storage.googleapis.com/jnl-up-j-dsj-files/journals/1/articles/1585/6544c599b267b.pdf","source":{"id":"https://openalex.org/S62969111","display_name":"Data Science Journal","issn_l":"1683-1470","issn":["1683-1470"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320511","host_organization_name":"Ubiquity Press","host_organization_lineage":["https://openalex.org/P4310320511"],"host_organization_lineage_names":["Ubiquity Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science Journal","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:ecaedd8c74a746cd9d1a9aca8cc40316","is_oa":true,"landing_page_url":"https://doaj.org/article/ecaedd8c74a746cd9d1a9aca8cc40316","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data Science Journal, Vol 22, Pp 42-42 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.5334/dsj-2023-042","is_oa":true,"landing_page_url":"https://doi.org/10.5334/dsj-2023-042","pdf_url":"https://storage.googleapis.com/jnl-up-j-dsj-files/journals/1/articles/1585/6544c599b267b.pdf","source":{"id":"https://openalex.org/S62969111","display_name":"Data Science Journal","issn_l":"1683-1470","issn":["1683-1470"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320511","host_organization_name":"Ubiquity Press","host_organization_lineage":["https://openalex.org/P4310320511"],"host_organization_lineage_names":["Ubiquity Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science Journal","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.75,"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388307524.pdf"},"referenced_works_count":17,"referenced_works":["https://openalex.org/W1985372952","https://openalex.org/W2025283258","https://openalex.org/W2093327464","https://openalex.org/W2124833832","https://openalex.org/W2138356150","https://openalex.org/W2182468807","https://openalex.org/W2194775991","https://openalex.org/W2618851150","https://openalex.org/W2911964244","https://openalex.org/W2962029365","https://openalex.org/W2969551072","https://openalex.org/W2970328536","https://openalex.org/W2982667388","https://openalex.org/W3044853528","https://openalex.org/W3126154634","https://openalex.org/W3126673261","https://openalex.org/W4385418145"],"related_works":["https://openalex.org/W1604939135","https://openalex.org/W2127058578","https://openalex.org/W2735368845","https://openalex.org/W2089764958","https://openalex.org/W2048488252","https://openalex.org/W4288365262","https://openalex.org/W2940614149","https://openalex.org/W4289884158","https://openalex.org/W2787485953","https://openalex.org/W3217432596"],"abstract_inverted_index":{"In":[0,128,152],"many":[1],"studies,":[2],"we":[3,18,155,171],"want":[4],"to":[5,65,103,144],"determine":[6,104,145],"the":[7,22,25,30,37,40,78,81,84,87,93,96,105,108,165,179,185,195],"influence":[8,26],"of":[9,24,69,77,80,107,114,160,197,202,208],"certain":[10],"features":[11],"on":[12,124,164,205],"a":[13,74,125,139,157,206],"dependent":[14,41,97],"variable.":[15,42],"More":[16,110],"specifically,":[17],"are":[19,73,122,134,138],"interested":[20],"in":[21,178],"strength":[23,79],"&ndash;":[27],"i.e.,":[28],"is":[29],"feature":[31,38,70,94,161],"relevant?":[32],"And,":[33],"if":[34],"so,":[35],"how":[36],"influences":[39],"Recently,":[43],"data-driven":[44],"approaches":[45],"such":[46],"as":[47],"random":[48,182],"forest":[49,183],"regression":[50],"have":[51],"found":[52],"their":[53],"way":[54],"into":[55],"applications":[56],"(Boulesteix":[57],"et":[58,149],"al.":[59,150],"2012).":[60],"These":[61],"models":[62,133],"allow":[63],"researchers":[64],"directly":[66],"derive":[67],"measures":[68],"importance,":[71],"which":[72,115],"natural":[75],"indicator":[76],"influence.":[82,109],"For":[83],"relevant":[85],"features,":[86,121],"correlation":[88,91],"or":[89],"rank":[90],"between":[92,120],"and":[95,141,188,210],"variable":[98],"has":[99],"typically":[100],"been":[101],"used":[102],"nature":[106],"recent":[111,140],"methods,":[112],"some":[113],"can":[116],"also":[117],"measure":[118],"interactions":[119],"based":[123,163],"modeling":[126],"approach.":[127],"particular,":[129],"when":[130],"machine":[131],"learning":[132],"used,":[135],"SHAP":[136],"scores":[137],"prominent":[142],"method":[143],"these":[146],"trends":[147,177],"(Lundberg":[148],"2017).":[151],"this":[153],"paper,":[154],"introduce":[156],"novel":[158],"notion":[159],"importance":[162],"well-studied":[166],"Gram-Schmidt":[167],"decorrelation":[168],"method.":[169],"Furthermore,":[170],"propose":[172],"two":[173],"estimators":[174,199,204],"for":[175],"identifying":[176],"data":[180],"using":[181],"regression,":[184],"so-called":[186],"absolute":[187],"relative":[189],"traversal":[190],"rate.":[191],"We":[192],"empirically":[193],"compare":[194],"properties":[196],"our":[198],"with":[200],"those":[201],"well-established":[203],"variety":[207],"synthetic":[209],"real-world":[211],"datasets.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
