{"id":"https://openalex.org/W2167848975","doi":"https://doi.org/10.1142/s021972001100546x","title":"CLASSIFICATION OF LARGE MICROARRAY DATASETS USING FAST RANDOM FOREST CONSTRUCTION","display_name":"CLASSIFICATION OF LARGE MICROARRAY DATASETS USING FAST RANDOM FOREST CONSTRUCTION","publication_year":2011,"publication_date":"2011-04-01","ids":{"openalex":"https://openalex.org/W2167848975","doi":"https://doi.org/10.1142/s021972001100546x","mag":"2167848975","pmid":"https://pubmed.ncbi.nlm.nih.gov/21523931"},"language":"en","primary_location":{"id":"doi:10.1142/s021972001100546x","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s021972001100546x","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025398249","display_name":"Elena Manilich","orcid":null},"institutions":[{"id":"https://openalex.org/I1316902750","display_name":"Cleveland Clinic","ror":"https://ror.org/03xjacd83","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1316902750"]},{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"ELENA A. MANILICH","raw_affiliation_strings":["Computer Science Department, Case Western Reserve University, Cleveland, Ohio 44106, USA","Digestive Disease Institute, Cleveland Clinic Cleveland, Ohio 44195, USA","Computer Science Department, Case Western Reserve University, Cleveland, Ohio 44106, USADigestive Disease Institute, Cleveland Clinic Cleveland, Ohio 44195, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Case Western Reserve University, Cleveland, Ohio 44106, USA","institution_ids":["https://openalex.org/I58956616"]},{"raw_affiliation_string":"Digestive Disease Institute, Cleveland Clinic Cleveland, Ohio 44195, USA","institution_ids":["https://openalex.org/I1316902750"]},{"raw_affiliation_string":"Computer Science Department, Case Western Reserve University, Cleveland, Ohio 44106, USADigestive Disease Institute, Cleveland Clinic Cleveland, Ohio 44195, USA","institution_ids":["https://openalex.org/I58956616","https://openalex.org/I1316902750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013424429","display_name":"Z. Meral \u00d6zsoyo\u011flu","orcid":null},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Z. MERAL \u00d6ZSOYO\u01e6LU","raw_affiliation_strings":["Computer Science Department, Case Western Reserve University, Cleveland, Ohio 44106, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Case Western Reserve University, Cleveland, Ohio 44106, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071984723","display_name":"VALERIY TRUBACHEV","orcid":null},"institutions":[{"id":"https://openalex.org/I1316902750","display_name":"Cleveland Clinic","ror":"https://ror.org/03xjacd83","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1316902750"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"VALERIY TRUBACHEV","raw_affiliation_strings":["Digestive Disease Institute, Cleveland Clinic Cleveland, Ohio 44195, USA"],"affiliations":[{"raw_affiliation_string":"Digestive Disease Institute, Cleveland Clinic Cleveland, Ohio 44195, USA","institution_ids":["https://openalex.org/I1316902750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063314967","display_name":"Tomas Radivoyevitch","orcid":"https://orcid.org/0000-0002-9701-1851"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"TOMAS RADIVOYEVITCH","raw_affiliation_strings":["Department of Epidemiology and Biostatistics, Case Western Reserve University, Cleveland, Ohio 44106, USA"],"affiliations":[{"raw_affiliation_string":"Department of Epidemiology and Biostatistics, Case Western Reserve University, Cleveland, Ohio 44106, USA","institution_ids":["https://openalex.org/I58956616"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5025398249"],"corresponding_institution_ids":["https://openalex.org/I1316902750","https://openalex.org/I58956616"],"apc_list":null,"apc_paid":null,"fwci":0.912,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.74040094,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"09","issue":"02","first_page":"251","last_page":"267"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9850000143051147,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.8993359804153442},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7420789003372192},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6349905729293823},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.607297956943512},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5404018759727478},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.5120251774787903},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5002584457397461},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.43393978476524353},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.394363135099411},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17512771487236023}],"concepts":[{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.8993359804153442},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7420789003372192},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6349905729293823},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.607297956943512},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5404018759727478},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.5120251774787903},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5002584457397461},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.43393978476524353},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.394363135099411},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17512771487236023},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000401","qualifier_name":"mortality","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000401","qualifier_name":"mortality","is_major_topic":false},{"descriptor_ui":"D016403","descriptor_name":"Lymphoma, Large B-Cell, Diffuse","qualifier_ui":"Q000401","qualifier_name":"mortality","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D046228","descriptor_name":"Microarray Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D046228","descriptor_name":"Microarray Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D046228","descriptor_name":"Microarray Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D053208","descriptor_name":"Kaplan-Meier Estimate","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D053208","descriptor_name":"Kaplan-Meier Estimate","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D053208","descriptor_name":"Kaplan-Meier Estimate","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1142/s021972001100546x","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s021972001100546x","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},{"id":"pmid:21523931","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/21523931","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of bioinformatics and computational biology","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","score":0.6800000071525574,"display_name":"Life in Land"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W273955616","https://openalex.org/W1483135265","https://openalex.org/W1520812622","https://openalex.org/W1539593569","https://openalex.org/W1570448133","https://openalex.org/W1576962511","https://openalex.org/W1594031697","https://openalex.org/W1637435380","https://openalex.org/W1976564639","https://openalex.org/W2014216829","https://openalex.org/W2030922238","https://openalex.org/W2033533336","https://openalex.org/W2050997351","https://openalex.org/W2064208261","https://openalex.org/W2070796617","https://openalex.org/W2086099578","https://openalex.org/W2119842880","https://openalex.org/W2140065103","https://openalex.org/W2147246240","https://openalex.org/W2148654292","https://openalex.org/W2911964244","https://openalex.org/W3085162807","https://openalex.org/W4252240993"],"related_works":["https://openalex.org/W2187546663","https://openalex.org/W148745890","https://openalex.org/W2899790217","https://openalex.org/W2429057255","https://openalex.org/W2889302474","https://openalex.org/W4323294312","https://openalex.org/W4366990902","https://openalex.org/W4317732970","https://openalex.org/W4313289487","https://openalex.org/W4321636153"],"abstract_inverted_index":{"Random":[0],"forest":[1,58,106,145],"is":[2,25,60,175],"an":[3,139],"ensemble":[4],"classification":[5],"algorithm.":[6],"It":[7,87],"performs":[8],"well":[9],"when":[10,20,96],"most":[11],"predictive":[12,171],"variables":[13,24],"are":[14],"noisy":[15],"and":[16,38,111,164,181,203],"can":[17],"be":[18],"used":[19],"the":[21,29,81,108,127,185,196],"number":[22,30],"of":[23,31,35,41,50,55,70,104,142,151,157,187],"much":[26],"larger":[27],"than":[28,47],"observations.":[32],"The":[33,52,173,190],"use":[34],"bootstrap":[36],"samples":[37],"restricted":[39],"subsets":[40],"attributes":[42],"makes":[43,195],"it":[44,64],"more":[45],"powerful":[46],"simple":[48],"ensembles":[49],"trees.":[51],"main":[53,188],"advantage":[54],"a":[56,74,136,143,158],"random":[57,105,144],"classifier":[59],"its":[61,116],"explanatory":[62],"power:":[63],"measures":[65],"variable":[66],"importance":[67],"or":[68],"impact":[69],"each":[71],"factor":[72],"on":[73,98,177,184],"predicted":[75],"class":[76],"label.":[77],"These":[78],"characteristics":[79],"make":[80],"algorithm":[82,161,197],"ideal":[83],"for":[84,118,199],"microarray":[85,100,152],"data.":[86],"was":[88],"shown":[89],"to":[90],"build":[91],"models":[92],"with":[93],"high":[94],"accuracy":[95],"tested":[97],"high-dimensional":[99],"datasets.":[101],"Current":[102],"implementations":[103],"in":[107,132],"machine":[109],"learning":[110],"statistics":[112],"community,":[113],"however,":[114],"limit":[115],"usability":[117],"mining":[119],"over":[120],"large":[121],"datasets,":[122],"as":[123],"they":[124],"require":[125],"that":[126],"entire":[128],"dataset":[129],"remains":[130],"permanently":[131],"memory.":[133,189],"We":[134],"propose":[135],"new":[137],"framework,":[138],"optimized":[140],"implementation":[141,174],"classifier,":[146],"which":[147],"addresses":[148],"specific":[149],"properties":[150],"data,":[153],"takes":[154],"computational":[155,193],"complexity":[156],"decision":[159],"tree":[160],"into":[162],"consideration,":[163],"shows":[165],"excellent":[166,192],"computing":[167],"performance":[168,194],"while":[169],"preserving":[170],"accuracy.":[172],"based":[176],"reducing":[178],"overlapping":[179],"computations":[180],"eliminating":[182],"dependency":[183],"size":[186],"implementation's":[191],"useful":[198],"interactive":[200],"data":[201,204],"analyses":[202],"mining.":[205]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
