{"id":"https://openalex.org/W2041392558","doi":"https://doi.org/10.1021/ci060164k","title":"Random Forest Models To Predict Aqueous Solubility","display_name":"Random Forest Models To Predict Aqueous Solubility","publication_year":2006,"publication_date":"2006-12-02","ids":{"openalex":"https://openalex.org/W2041392558","doi":"https://doi.org/10.1021/ci060164k","mag":"2041392558","pmid":"https://pubmed.ncbi.nlm.nih.gov/17238260"},"language":"en","primary_location":{"id":"doi:10.1021/ci060164k","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci060164k","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069304320","display_name":"David Scott Palmer","orcid":"https://orcid.org/0000-0003-4356-9144"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"David S. Palmer","raw_affiliation_strings":["Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","Physics"],"affiliations":[{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]},{"raw_affiliation_string":"Physics","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036721569","display_name":"Noel M. O\u2019Boyle","orcid":"https://orcid.org/0000-0003-4879-2003"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Noel M. O'Boyle","raw_affiliation_strings":["Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom,"],"affiliations":[{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]},{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom,","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014283781","display_name":"Robert C. Glen","orcid":"https://orcid.org/0000-0003-1759-2914"},"institutions":[{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]},{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Robert C. Glen","raw_affiliation_strings":["Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom,"],"affiliations":[{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]},{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom,","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046050351","display_name":"John B. O. Mitchell","orcid":"https://orcid.org/0000-0002-0379-6097"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"John B. O. Mitchell","raw_affiliation_strings":["Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom,"],"affiliations":[{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]},{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, University of Cambridge, Lensfield Road, Cambridge CB2 1EW, United Kingdom,","institution_ids":["https://openalex.org/I241749","https://openalex.org/I1342131907"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5069304320"],"corresponding_institution_ids":["https://openalex.org/I1342131907","https://openalex.org/I241749"],"apc_list":null,"apc_paid":null,"fwci":5.7296,"has_fulltext":false,"cited_by_count":369,"citation_normalized_percentile":{"value":0.96431572,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"47","issue":"1","first_page":"150","last_page":"158"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11881","display_name":"Crystallization and Solubility Studies","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.7988712191581726},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.7629446983337402},{"id":"https://openalex.org/keywords/test-set","display_name":"Test set","score":0.6492449045181274},{"id":"https://openalex.org/keywords/quantitative-structure\u2013activity-relationship","display_name":"Quantitative structure\u2013activity relationship","score":0.6275774836540222},{"id":"https://openalex.org/keywords/partial-least-squares-regression","display_name":"Partial least squares regression","score":0.6228436231613159},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.562663733959198},{"id":"https://openalex.org/keywords/solubility","display_name":"Solubility","score":0.5595479011535645},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.5196958184242249},{"id":"https://openalex.org/keywords/molecular-descriptor","display_name":"Molecular descriptor","score":0.5127668976783752},{"id":"https://openalex.org/keywords/least-squares-support-vector-machine","display_name":"Least squares support vector machine","score":0.4964335560798645},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47409090399742126},{"id":"https://openalex.org/keywords/linear-regression","display_name":"Linear regression","score":0.46788424253463745},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4678400754928589},{"id":"https://openalex.org/keywords/correlation-coefficient","display_name":"Correlation coefficient","score":0.4588163495063782},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.45059144496917725},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.44291743636131287},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.4212367534637451},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4192023277282715},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3985349237918854},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.39353296160697937},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.3919222056865692},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.30448421835899353},{"id":"https://openalex.org/keywords/organic-chemistry","display_name":"Organic chemistry","score":0.0944347083568573}],"concepts":[{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.7988712191581726},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.7629446983337402},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.6492449045181274},{"id":"https://openalex.org/C164126121","wikidata":"https://www.wikidata.org/wiki/Q766383","display_name":"Quantitative structure\u2013activity relationship","level":2,"score":0.6275774836540222},{"id":"https://openalex.org/C22354355","wikidata":"https://www.wikidata.org/wiki/Q422009","display_name":"Partial least squares regression","level":2,"score":0.6228436231613159},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.562663733959198},{"id":"https://openalex.org/C155574463","wikidata":"https://www.wikidata.org/wiki/Q170731","display_name":"Solubility","level":2,"score":0.5595479011535645},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.5196958184242249},{"id":"https://openalex.org/C164923092","wikidata":"https://www.wikidata.org/wiki/Q3705921","display_name":"Molecular descriptor","level":3,"score":0.5127668976783752},{"id":"https://openalex.org/C145828037","wikidata":"https://www.wikidata.org/wiki/Q17086219","display_name":"Least squares support vector machine","level":3,"score":0.4964335560798645},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47409090399742126},{"id":"https://openalex.org/C48921125","wikidata":"https://www.wikidata.org/wiki/Q10861030","display_name":"Linear regression","level":2,"score":0.46788424253463745},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4678400754928589},{"id":"https://openalex.org/C2780092901","wikidata":"https://www.wikidata.org/wiki/Q3433612","display_name":"Correlation coefficient","level":2,"score":0.4588163495063782},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45059144496917725},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.44291743636131287},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.4212367534637451},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4192023277282715},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3985349237918854},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39353296160697937},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.3919222056865692},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.30448421835899353},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0944347083568573},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D009930","descriptor_name":"Organic Chemicals","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D009930","descriptor_name":"Organic Chemicals","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D009930","descriptor_name":"Organic Chemicals","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D009930","descriptor_name":"Organic Chemicals","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012044","descriptor_name":"Regression Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012044","descriptor_name":"Regression Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012044","descriptor_name":"Regression Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012044","descriptor_name":"Regression Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D014867","descriptor_name":"Water","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D014867","descriptor_name":"Water","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D014867","descriptor_name":"Water","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D014867","descriptor_name":"Water","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":4,"locations":[{"id":"doi:10.1021/ci060164k","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci060164k","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:17238260","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/17238260","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:strathprints.strath.ac.uk:39174","is_oa":false,"landing_page_url":"https://strathprints.strath.ac.uk/39174/","pdf_url":null,"source":{"id":"https://openalex.org/S4306402226","display_name":"Strathprints: The University of Strathclyde institutional repository (University of Strathclyde)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I181647926","host_organization_name":"University of Strathclyde","host_organization_lineage":["https://openalex.org/I181647926"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.574.8101","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.574.8101","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.msm.cam.ac.uk/pfizer/pdf/Publications/P13 (03) - Random Forest Models To Predict Aqueous Solubility.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","score":0.75,"display_name":"Life in Land"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320307765","display_name":"Pfizer","ror":"https://ror.org/01xdqrp08"},{"id":"https://openalex.org/F4320309585","display_name":"Unilever","ror":"https://ror.org/05n8ah907"},{"id":"https://openalex.org/F4320334629","display_name":"Biotechnology and Biological Sciences Research Council","ror":"https://ror.org/00cwqg982"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W273955616","https://openalex.org/W1568759573","https://openalex.org/W1594031697","https://openalex.org/W1601740268","https://openalex.org/W1980739931","https://openalex.org/W1983938727","https://openalex.org/W1988195734","https://openalex.org/W2013894207","https://openalex.org/W2019980219","https://openalex.org/W2025948031","https://openalex.org/W2033511432","https://openalex.org/W2040446474","https://openalex.org/W2052723761","https://openalex.org/W2055800653","https://openalex.org/W2063346968","https://openalex.org/W2076498053","https://openalex.org/W2076802558","https://openalex.org/W2080242559","https://openalex.org/W2085890279","https://openalex.org/W2094836090","https://openalex.org/W2099014892","https://openalex.org/W2107983513","https://openalex.org/W2109978476","https://openalex.org/W2146060259","https://openalex.org/W2162429866","https://openalex.org/W2166008508","https://openalex.org/W2197112043","https://openalex.org/W2206827903","https://openalex.org/W2330820318","https://openalex.org/W2911964244","https://openalex.org/W4299796063"],"related_works":["https://openalex.org/W2033669961","https://openalex.org/W2148009427","https://openalex.org/W1518515965","https://openalex.org/W1978931025","https://openalex.org/W3159291941","https://openalex.org/W2063120953","https://openalex.org/W2753230657","https://openalex.org/W2165637039","https://openalex.org/W2026843845","https://openalex.org/W2889092195"],"abstract_inverted_index":{"Random":[0,37],"Forest":[1,38],"regression":[2,39,166],"(RF),":[3],"Partial-Least-Squares":[4],"(PLS)":[5],"regression,":[6],"Support":[7],"Vector":[8],"Machines":[9],"(SVM),":[10],"and":[11,52,54,66,107,139],"Artificial":[12],"Neural":[13],"Networks":[14],"(ANN)":[15],"were":[16],"used":[17],"to":[18,77,129,144],"develop":[19],"QSPR":[20],"models":[21],"for":[22,32,57,87],"the":[23,121,123,134,137,145,152,158,165],"prediction":[24,82],"of":[25,63,70,74,83,92,136,160],"aqueous":[26,42],"solubility,":[27],"based":[28],"on":[29,157],"experimental":[30],"data":[31,117,155],"988":[33],"organic":[34],"molecules.":[35],"The":[36,81],"model":[40,124],"predicted":[41],"solubility":[43,86],"more":[44],"accurately":[45],"than":[46],"those":[47],"created":[48],"by":[49,149,164],"PLS,":[50],"SVM,":[51],"ANN":[53],"offered":[55],"methods":[56],"automatic":[58],"descriptor":[59,64],"selection,":[60],"an":[61,67,88,103],"assessment":[62],"importance,":[65],"in-parallel":[68],"measure":[69],"predictive":[71],"ability,":[72],"all":[73],"which":[75],"serve":[76],"recommend":[78],"its":[79],"use.":[80],"log":[84,111],"molar":[85],"external":[89],"test":[90,140],"set":[91,118],"330":[93],"molecules":[94,150],"that":[95],"are":[96,142],"solid":[97],"at":[98],"25":[99],"degrees":[100],"C":[101],"gave":[102],"r2":[104],"=":[105,109],"0.89":[106],"RMSE":[108],"0.69":[110],"S":[112],"units.":[113],"For":[114],"a":[115],"standard":[116],"selected":[119,163],"from":[120],"literature,":[122],"performed":[125],"well":[126],"with":[127],"respect":[128],"other":[130],"documented":[131],"methods.":[132],"Finally,":[133],"diversity":[135],"training":[138],"sets":[141],"compared":[143],"chemical":[146],"space":[147],"occupied":[148],"in":[151],"MDL":[153],"drug":[154],"report,":[156],"basis":[159],"molecular":[161],"descriptors":[162],"analysis.":[167]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":26},{"year":2024,"cited_by_count":26},{"year":2023,"cited_by_count":26},{"year":2022,"cited_by_count":30},{"year":2021,"cited_by_count":36},{"year":2020,"cited_by_count":40},{"year":2019,"cited_by_count":25},{"year":2018,"cited_by_count":25},{"year":2017,"cited_by_count":17},{"year":2016,"cited_by_count":11},{"year":2015,"cited_by_count":13},{"year":2014,"cited_by_count":19},{"year":2013,"cited_by_count":10},{"year":2012,"cited_by_count":8}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
