{"id":"https://openalex.org/W2010117910","doi":"https://doi.org/10.1021/ci900377e","title":"Insolubility Classification with Accurate Prediction Probabilities Using a MetaClassifier","display_name":"Insolubility Classification with Accurate Prediction Probabilities Using a MetaClassifier","publication_year":2010,"publication_date":"2010-01-20","ids":{"openalex":"https://openalex.org/W2010117910","doi":"https://doi.org/10.1021/ci900377e","mag":"2010117910","pmid":"https://pubmed.ncbi.nlm.nih.gov/20088498"},"language":"en","primary_location":{"id":"doi:10.1021/ci900377e","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci900377e","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078834012","display_name":"Christian Kr\u00e4mer","orcid":"https://orcid.org/0000-0001-8663-5266"},"institutions":[{"id":"https://openalex.org/I4210112752","display_name":"Boehringer Ingelheim (United Kingdom)","ror":"https://ror.org/01jnnpe14","country_code":"GB","type":"company","lineage":["https://openalex.org/I1330995197","https://openalex.org/I4210112752"]},{"id":"https://openalex.org/I63072094","display_name":"University of Portsmouth","ror":"https://ror.org/03ykbk197","country_code":"GB","type":"education","lineage":["https://openalex.org/I63072094"]},{"id":"https://openalex.org/I181369854","display_name":"Friedrich-Alexander-Universit\u00e4t Erlangen-N\u00fcrnberg","ror":"https://ror.org/00f7hpc57","country_code":"DE","type":"education","lineage":["https://openalex.org/I181369854"]}],"countries":["DE","GB"],"is_corresponding":true,"raw_author_name":"Christian Kramer","raw_affiliation_strings":["Department of Lead Discovery, Boehringer-Ingelheim Pharma GmbH & Co. KG, 88397 Biberach, Germany, Computer-Chemie-Centrum and Interdisciplinary Center for Molecular Materials, Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg, N\u00e4gelsbachstrasse 52, 91052 Erlangen, Germany, and Centre for Molecular Design, University of Portsmouth, Mercantile House, Hampshire Terrace, Portsmouth, PO1 2EG, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Lead Discovery, Boehringer-Ingelheim Pharma GmbH & Co. KG, 88397 Biberach, Germany, Computer-Chemie-Centrum and Interdisciplinary Center for Molecular Materials, Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg, N\u00e4gelsbachstrasse 52, 91052 Erlangen, Germany, and Centre for Molecular Design, University of Portsmouth, Mercantile House, Hampshire Terrace, Portsmouth, PO1 2EG, United Kingdom","institution_ids":["https://openalex.org/I63072094","https://openalex.org/I4210112752","https://openalex.org/I181369854"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078568475","display_name":"Bernd Beck","orcid":null},"institutions":[{"id":"https://openalex.org/I181369854","display_name":"Friedrich-Alexander-Universit\u00e4t Erlangen-N\u00fcrnberg","ror":"https://ror.org/00f7hpc57","country_code":"DE","type":"education","lineage":["https://openalex.org/I181369854"]},{"id":"https://openalex.org/I4210112752","display_name":"Boehringer Ingelheim (United Kingdom)","ror":"https://ror.org/01jnnpe14","country_code":"GB","type":"company","lineage":["https://openalex.org/I1330995197","https://openalex.org/I4210112752"]},{"id":"https://openalex.org/I63072094","display_name":"University of Portsmouth","ror":"https://ror.org/03ykbk197","country_code":"GB","type":"education","lineage":["https://openalex.org/I63072094"]}],"countries":["DE","GB"],"is_corresponding":false,"raw_author_name":"Bernd Beck","raw_affiliation_strings":["Department of Lead Discovery, Boehringer-Ingelheim Pharma GmbH & Co. KG, 88397 Biberach, Germany, Computer-Chemie-Centrum and Interdisciplinary Center for Molecular Materials, Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg, N\u00e4gelsbachstrasse 52, 91052 Erlangen, Germany, and Centre for Molecular Design, University of Portsmouth, Mercantile House, Hampshire Terrace, Portsmouth, PO1 2EG, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Lead Discovery, Boehringer-Ingelheim Pharma GmbH & Co. KG, 88397 Biberach, Germany, Computer-Chemie-Centrum and Interdisciplinary Center for Molecular Materials, Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg, N\u00e4gelsbachstrasse 52, 91052 Erlangen, Germany, and Centre for Molecular Design, University of Portsmouth, Mercantile House, Hampshire Terrace, Portsmouth, PO1 2EG, United Kingdom","institution_ids":["https://openalex.org/I63072094","https://openalex.org/I4210112752","https://openalex.org/I181369854"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017203543","display_name":"Timothy Clark","orcid":"https://orcid.org/0000-0001-7931-4659"},"institutions":[{"id":"https://openalex.org/I4210112752","display_name":"Boehringer Ingelheim (United Kingdom)","ror":"https://ror.org/01jnnpe14","country_code":"GB","type":"company","lineage":["https://openalex.org/I1330995197","https://openalex.org/I4210112752"]},{"id":"https://openalex.org/I63072094","display_name":"University of Portsmouth","ror":"https://ror.org/03ykbk197","country_code":"GB","type":"education","lineage":["https://openalex.org/I63072094"]},{"id":"https://openalex.org/I181369854","display_name":"Friedrich-Alexander-Universit\u00e4t Erlangen-N\u00fcrnberg","ror":"https://ror.org/00f7hpc57","country_code":"DE","type":"education","lineage":["https://openalex.org/I181369854"]}],"countries":["DE","GB"],"is_corresponding":false,"raw_author_name":"Timothy Clark","raw_affiliation_strings":["Department of Lead Discovery, Boehringer-Ingelheim Pharma GmbH & Co. KG, 88397 Biberach, Germany, Computer-Chemie-Centrum and Interdisciplinary Center for Molecular Materials, Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg, N\u00e4gelsbachstrasse 52, 91052 Erlangen, Germany, and Centre for Molecular Design, University of Portsmouth, Mercantile House, Hampshire Terrace, Portsmouth, PO1 2EG, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Lead Discovery, Boehringer-Ingelheim Pharma GmbH & Co. KG, 88397 Biberach, Germany, Computer-Chemie-Centrum and Interdisciplinary Center for Molecular Materials, Friedrich-Alexander Universit\u00e4t Erlangen-N\u00fcrnberg, N\u00e4gelsbachstrasse 52, 91052 Erlangen, Germany, and Centre for Molecular Design, University of Portsmouth, Mercantile House, Hampshire Terrace, Portsmouth, PO1 2EG, United Kingdom","institution_ids":["https://openalex.org/I63072094","https://openalex.org/I4210112752","https://openalex.org/I181369854"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5078834012"],"corresponding_institution_ids":["https://openalex.org/I181369854","https://openalex.org/I4210112752","https://openalex.org/I63072094"],"apc_list":null,"apc_paid":null,"fwci":4.3489,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.94271116,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"50","issue":"3","first_page":"404","last_page":"414"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11881","display_name":"Crystallization and Solubility Studies","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9804999828338623,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.8433175683021545},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6218804717063904},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5692183375358582},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.5687171220779419},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5504345893859863},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.47501882910728455},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4560205936431885},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.44839608669281006},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4451344907283783},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.438040167093277},{"id":"https://openalex.org/keywords/cheminformatics","display_name":"Cheminformatics","score":0.4256441593170166},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4164563715457916},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.36373937129974365},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.17499834299087524}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.8433175683021545},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6218804717063904},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5692183375358582},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.5687171220779419},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5504345893859863},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.47501882910728455},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4560205936431885},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.44839608669281006},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4451344907283783},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.438040167093277},{"id":"https://openalex.org/C68762167","wikidata":"https://www.wikidata.org/wiki/Q910164","display_name":"Cheminformatics","level":2,"score":0.4256441593170166},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4164563715457916},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36373937129974365},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.17499834299087524},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C147597530","wikidata":"https://www.wikidata.org/wiki/Q369472","display_name":"Computational chemistry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012995","descriptor_name":"Solubility","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/ci900377e","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci900377e","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:20088498","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/20088498","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321026","display_name":"Ministry of Earth Sciences","ror":"https://ror.org/013cf5k59"},{"id":"https://openalex.org/F4320322099","display_name":"Korea Institute of Energy Research","ror":"https://ror.org/0298pes53"},{"id":"https://openalex.org/F4320322724","display_name":"Ministry of Education, India","ror":"https://ror.org/048xjjh50"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W169410579","https://openalex.org/W1522205938","https://openalex.org/W1562218083","https://openalex.org/W1562347366","https://openalex.org/W1567512734","https://openalex.org/W1963847586","https://openalex.org/W1968688544","https://openalex.org/W1969387965","https://openalex.org/W1969747177","https://openalex.org/W1978163942","https://openalex.org/W1980956598","https://openalex.org/W1983938727","https://openalex.org/W1984687803","https://openalex.org/W1987749240","https://openalex.org/W1988195734","https://openalex.org/W1989816927","https://openalex.org/W1990057891","https://openalex.org/W2009638172","https://openalex.org/W2013894207","https://openalex.org/W2014518985","https://openalex.org/W2014722063","https://openalex.org/W2016263386","https://openalex.org/W2019966295","https://openalex.org/W2020602991","https://openalex.org/W2039155367","https://openalex.org/W2040389962","https://openalex.org/W2041392558","https://openalex.org/W2053184574","https://openalex.org/W2055800653","https://openalex.org/W2058935979","https://openalex.org/W2061481072","https://openalex.org/W2063346968","https://openalex.org/W2065717478","https://openalex.org/W2076498053","https://openalex.org/W2077973224","https://openalex.org/W2080653934","https://openalex.org/W2082601980","https://openalex.org/W2087661061","https://openalex.org/W2090996511","https://openalex.org/W2091263182","https://openalex.org/W2091758060","https://openalex.org/W2107983513","https://openalex.org/W2115758667","https://openalex.org/W2116452394","https://openalex.org/W2132450507","https://openalex.org/W2134976703","https://openalex.org/W2138095345","https://openalex.org/W2139212933","https://openalex.org/W2153635508","https://openalex.org/W2166008508","https://openalex.org/W2294798173","https://openalex.org/W2318099008","https://openalex.org/W2911964244","https://openalex.org/W4238793347","https://openalex.org/W4251903194","https://openalex.org/W4297957988"],"related_works":["https://openalex.org/W1574414179","https://openalex.org/W4362597605","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W4297676672","https://openalex.org/W4281702477","https://openalex.org/W4378510483","https://openalex.org/W4376166922","https://openalex.org/W2490526372","https://openalex.org/W2889302474"],"abstract_inverted_index":{"Insolubility":[0],"is":[1,110,134],"a":[2,36,82,102,130],"crucial":[3],"issue":[4],"in":[5,67],"drug":[6],"design":[7],"because":[8],"insoluble":[9,146],"compounds":[10,42,147],"are":[11],"often":[12],"measured":[13,43],"to":[14,112],"be":[15,20],"inactive":[16],"although":[17],"they":[18,23],"might":[19],"active":[21],"if":[22],"were":[24,65],"soluble.":[25],"We":[26,80],"provide":[27],"and":[28,41,54,56,63,77,94,120,145,148],"analyze":[29],"various":[30],"insolubility":[31],"classification":[32],"models":[33],"based":[34],"on":[35,129],"recently":[37],"published":[38],"data":[39],"set":[40],"in-house":[44],"at":[45,95],"Boehringer-Ingelheim.":[46],"The":[47,107],"2D":[48],"descriptor":[49,59,100],"sets":[50,60],"from":[51,61],"pharmacophore":[52],"fingerprints":[53],"MOE":[55],"the":[57,90,96,113,137],"3D":[58],"ParaSurf":[62],"VolSurf":[64],"examined":[66],"conjunction":[68],"with":[69,136,139,158],"support":[70],"vector":[71],"machines,":[72],"Bayesian":[73],"regularized":[74],"neural":[75],"networks,":[76],"random":[78],"forests.":[79],"introduce":[81],"classifier-fusion":[83],"strategy,":[84],"called":[85],"metaclassifier,":[86,138],"which":[87],"improves":[88],"upon":[89],"best":[91],"single":[92],"prediction":[93,125,149],"same":[97],"time":[98],"avoids":[99],"selection,":[101],"potential":[103],"source":[104],"of":[105,117,127,143],"overfitting.":[106],"metaclassifier":[108],"strategy":[109],"compared":[111],"simpler":[114],"fusion":[115],"strategies":[116],"maximum":[118,155],"vote":[119],"highest":[121],"probability":[122],"picking.":[123],"A":[124],"accuracy":[126],"72.6%":[128],"three":[131],"class":[132],"model":[133],"achieved":[135],"nearly":[140],"perfect":[141],"separation":[142],"soluble":[144],"as":[150,152],"good":[151],"our":[153],"calculated":[154],"possible":[156],"agreement":[157],"experiment.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
