{"id":"https://openalex.org/W3091686725","doi":"https://doi.org/10.1109/access.2020.3027828","title":"Extension of pQSAR: Ensemble Model Generated by Random Forest and Partial Least Squares Regressions","display_name":"Extension of pQSAR: Ensemble Model Generated by Random Forest and Partial Least Squares Regressions","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3091686725","doi":"https://doi.org/10.1109/access.2020.3027828","mag":"3091686725"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3027828","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3027828","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09210102.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09210102.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101705210","display_name":"Byung Chun Kim","orcid":"https://orcid.org/0000-0002-3895-3021"},"institutions":[{"id":"https://openalex.org/I4210158432","display_name":"National Institute for Mathematical Sciences","ror":"https://ror.org/04n7py080","country_code":"KR","type":"education","lineage":["https://openalex.org/I4210158432"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Byung Chun Kim","raw_affiliation_strings":["National Institute for Mathematical Science, Daejeon, South Korea"],"raw_orcid":"https://orcid.org/0000-0002-3895-3021","affiliations":[{"raw_affiliation_string":"National Institute for Mathematical Science, Daejeon, South Korea","institution_ids":["https://openalex.org/I4210158432"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042118829","display_name":"Dosang Joe","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158432","display_name":"National Institute for Mathematical Sciences","ror":"https://ror.org/04n7py080","country_code":"KR","type":"education","lineage":["https://openalex.org/I4210158432"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Dosang Joe","raw_affiliation_strings":["National Institute for Mathematical Science, Daejeon, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Institute for Mathematical Science, Daejeon, South Korea","institution_ids":["https://openalex.org/I4210158432"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080174843","display_name":"Youngho Woo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158432","display_name":"National Institute for Mathematical Sciences","ror":"https://ror.org/04n7py080","country_code":"KR","type":"education","lineage":["https://openalex.org/I4210158432"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Youngho Woo","raw_affiliation_strings":["National Institute for Mathematical Science, Daejeon, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Institute for Mathematical Science, Daejeon, South Korea","institution_ids":["https://openalex.org/I4210158432"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079853146","display_name":"Yongkuk Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I31419693","display_name":"Kyungpook National University","ror":"https://ror.org/040c17130","country_code":"KR","type":"education","lineage":["https://openalex.org/I31419693"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yongkuk Kim","raw_affiliation_strings":["Kyungpook National University, Daegu, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kyungpook National University, Daegu, South Korea","institution_ids":["https://openalex.org/I31419693"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065291585","display_name":"Gang-Joon Yoon","orcid":"https://orcid.org/0000-0002-0654-491X"},"institutions":[{"id":"https://openalex.org/I4210158432","display_name":"National Institute for Mathematical Sciences","ror":"https://ror.org/04n7py080","country_code":"KR","type":"education","lineage":["https://openalex.org/I4210158432"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gangjoon Yoon","raw_affiliation_strings":["National Institute for Mathematical Science, Daejeon, South Korea"],"raw_orcid":"https://orcid.org/0000-0002-0654-491X","affiliations":[{"raw_affiliation_string":"National Institute for Mathematical Science, Daejeon, South Korea","institution_ids":["https://openalex.org/I4210158432"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101705210"],"corresponding_institution_ids":["https://openalex.org/I4210158432"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.5826,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.74300781,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":"8","issue":null,"first_page":"180087","last_page":"180099"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9830999970436096,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/partial-least-squares-regression","display_name":"Partial least squares regression","score":0.8390878438949585},{"id":"https://openalex.org/keywords/chembl","display_name":"chEMBL","score":0.797214925289154},{"id":"https://openalex.org/keywords/quantitative-structure\u2013activity-relationship","display_name":"Quantitative structure\u2013activity relationship","score":0.7435051202774048},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.7027006149291992},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5733072757720947},{"id":"https://openalex.org/keywords/applicability-domain","display_name":"Applicability domain","score":0.5329561829566956},{"id":"https://openalex.org/keywords/extension","display_name":"Extension (predicate logic)","score":0.4989292621612549},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.4810481369495392},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.47457268834114075},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.46602556109428406},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45220279693603516},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4276212453842163},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4141732454299927},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.36107009649276733},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.35864412784576416},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3313259482383728},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.120425283908844},{"id":"https://openalex.org/keywords/drug-discovery","display_name":"Drug discovery","score":0.11230549216270447}],"concepts":[{"id":"https://openalex.org/C22354355","wikidata":"https://www.wikidata.org/wiki/Q422009","display_name":"Partial least squares regression","level":2,"score":0.8390878438949585},{"id":"https://openalex.org/C63222358","wikidata":"https://www.wikidata.org/wiki/Q6120337","display_name":"chEMBL","level":3,"score":0.797214925289154},{"id":"https://openalex.org/C164126121","wikidata":"https://www.wikidata.org/wiki/Q766383","display_name":"Quantitative structure\u2013activity relationship","level":2,"score":0.7435051202774048},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.7027006149291992},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5733072757720947},{"id":"https://openalex.org/C107908354","wikidata":"https://www.wikidata.org/wiki/Q4781456","display_name":"Applicability domain","level":3,"score":0.5329561829566956},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.4989292621612549},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.4810481369495392},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.47457268834114075},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.46602556109428406},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45220279693603516},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4276212453842163},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4141732454299927},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.36107009649276733},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.35864412784576416},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3313259482383728},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.120425283908844},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.11230549216270447},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3027828","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3027828","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09210102.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:ba480caea6ca4f9993e9a125381ab8e8","is_oa":true,"landing_page_url":"https://doaj.org/article/ba480caea6ca4f9993e9a125381ab8e8","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 180087-180099 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3027828","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3027828","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09210102.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land","score":0.7300000190734863}],"awards":[{"id":"https://openalex.org/G1984158407","display_name":null,"funder_award_id":"NIMS-B20900000","funder_id":"https://openalex.org/F4320314264","funder_display_name":"Institute of Mathematical Sciences"}],"funders":[{"id":"https://openalex.org/F4320314264","display_name":"Institute of Mathematical Sciences","ror":"https://ror.org/05078rg59"},{"id":"https://openalex.org/F4320334904","display_name":"National Institute for Materials Science","ror":"https://ror.org/026v1ze26"},{"id":"https://openalex.org/F4320337380","display_name":"Division of Mathematical Sciences","ror":"https://ror.org/051fftw81"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3091686725.pdf","grobid_xml":"https://content.openalex.org/works/W3091686725.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W127874241","https://openalex.org/W1501372585","https://openalex.org/W1531524766","https://openalex.org/W1534477342","https://openalex.org/W1605923270","https://openalex.org/W1975875968","https://openalex.org/W1988195734","https://openalex.org/W1999798000","https://openalex.org/W2005361085","https://openalex.org/W2007953805","https://openalex.org/W2019966295","https://openalex.org/W2025649629","https://openalex.org/W2046653925","https://openalex.org/W2084446624","https://openalex.org/W2120771633","https://openalex.org/W2122811202","https://openalex.org/W2135293965","https://openalex.org/W2138525748","https://openalex.org/W2232501282","https://openalex.org/W2522945796","https://openalex.org/W2531064432","https://openalex.org/W2604060680","https://openalex.org/W2607306668","https://openalex.org/W2714724074","https://openalex.org/W2902800472","https://openalex.org/W2903306934","https://openalex.org/W2903803734","https://openalex.org/W2934083573","https://openalex.org/W2942245950","https://openalex.org/W2972499938","https://openalex.org/W2973093569","https://openalex.org/W2982188507","https://openalex.org/W4246656997","https://openalex.org/W4301433451","https://openalex.org/W6632075054","https://openalex.org/W6644359581"],"related_works":["https://openalex.org/W2746158299","https://openalex.org/W1969085205","https://openalex.org/W1977382278","https://openalex.org/W2399851305","https://openalex.org/W1970841929","https://openalex.org/W2985099987","https://openalex.org/W2792658424","https://openalex.org/W2309296013","https://openalex.org/W3005120176","https://openalex.org/W2055287694"],"abstract_inverted_index":{"Quantitative":[0],"structure-activity":[1],"relationship":[2],"(QSAR)":[3],"regression":[4,87],"models":[5],"are":[6,122,131],"mathematical":[7],"ones":[8],"which":[9],"relate":[10],"the":[11,17,20,24,29,35,94,106,112,116,128,139,143,149,170,191,209,212,243],"structural":[12],"properties":[13],"of":[14,19,23,34,54,78,115,160,168,180,201,204,211,233,242],"chemicals":[15],"to":[16,141,240],"potencies":[18],"biological":[21],"activities":[22],"chemicals.":[25,55],"In":[26,89,152],"QSAR":[27,57],"models,":[28,182],"physical":[30],"and":[31,83,101,127,146,165,184,193,206],"chemical":[32],"information":[33],"molecules":[36],"is":[37,66],"encoded":[38],"into":[39],"quantitative":[40],"numbers":[41],"called":[42],"descriptors.":[43],"Recently,":[44],"experimental":[45],"test":[46],"results":[47],"(profiles)":[48],"have":[49],"been":[50,187],"used":[51],"as":[52],"descriptors":[53],"Profile":[56],"2.0":[58],"(pQSAR)":[59],"model":[60,159,226],"suggested":[61],"by":[62,163,177],"Martin":[63],"et":[64],"al.,":[65],"a":[67,76],"multitask,":[68],"two":[69,178],"step":[70,114],"machine":[71],"learning":[72],"prediction":[73,181,199,229],"method":[74],"with":[75,99],"combination":[77,203],"random":[79],"forest":[80],"regressions":[81],"(RFRs)":[82],"partial":[84],"least":[85],"squares":[86],"(PLSR).":[88],"pQSAR":[90,117,161,244],"model,":[91],"one":[92],"fills":[93],"profile":[95,107,144,175,216],"table's":[96],"missing":[97],"values":[98],"RFRs":[100,164,183,205],"then":[102,147],"builds":[103],"PLSR":[104],"using":[105],"predictions.":[108],"Note":[109],"that":[110,241],"in":[111,231],"second":[113,150],"method,":[118],"PLSR's":[119],"predictor":[120],"variables":[121,130],"profiles;":[123],"so":[124],"activity":[125,133],"values,":[126],"response":[129],"also":[132],"values.":[134],"Thus":[135],"we":[136,155],"can":[137],"use":[138],"PLSRs":[140,207],"update":[142],"table":[145,176],"repeat":[148],"step.":[151],"this":[153],"work,":[154],"propose":[156],"an":[157],"extended":[158],"generated":[162],"PLSRs.":[166],"Experiment":[167],"updating":[169],"given":[171,219],"full":[172],"initially":[173],"predicted":[174,215],"kinds":[179],"PLSRs,":[185],"has":[186,227],"conducted":[188],"iteratively":[189],"for":[190,218],"PKIS":[192],"ChEMBL":[194],"data":[195],"sets.":[196],"Even":[197],"though":[198],"performance":[200,230],"individual":[202],"varies,":[208],"average":[210],"all":[213],"possible":[214],"tables":[217],"iteration":[220],"shows":[221],"better":[222,228],"performance.":[223],"This":[224],"ensemble":[225],"sense":[232],"Pearson's":[234],"R":[235],"<sup":[236],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[237],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[238],"compared":[239],"model.":[245]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
