{"id":"https://openalex.org/W2078065540","doi":"https://doi.org/10.1021/ci800097k","title":"Data Mining the NCI60 to Predict Generalized Cytotoxicity","display_name":"Data Mining the NCI60 to Predict Generalized Cytotoxicity","publication_year":2008,"publication_date":"2008-06-28","ids":{"openalex":"https://openalex.org/W2078065540","doi":"https://doi.org/10.1021/ci800097k","mag":"2078065540","pmid":"https://pubmed.ncbi.nlm.nih.gov/18588283"},"language":"en","primary_location":{"id":"doi:10.1021/ci800097k","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci800097k","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2561991","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100722331","display_name":"Adam Lee","orcid":"https://orcid.org/0000-0002-0189-171X"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Adam C. Lee","raw_affiliation_strings":["Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013706483","display_name":"Kerby Shedden","orcid":"https://orcid.org/0000-0001-7222-6664"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kerby Shedden","raw_affiliation_strings":["Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004547426","display_name":"Gustavo R. Rosania","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gustavo R. Rosania","raw_affiliation_strings":["Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108390238","display_name":"Gordon M. Crippen","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Gordon M. Crippen","raw_affiliation_strings":["Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of Medicinal Chemistry and Pharmaceutical Sciences, College of Pharmacy, and Department of Statistics, University of Michigan, Ann Arbor, Michigan 48109","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5108390238"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":6.2093,"has_fulltext":false,"cited_by_count":39,"citation_normalized_percentile":{"value":0.96508728,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"48","issue":"7","first_page":"1379","last_page":"1388"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9775000214576721,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.9750000238418579,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cytotoxic-t-cell","display_name":"Cytotoxic T cell","score":0.5620497465133667},{"id":"https://openalex.org/keywords/cytotoxicity","display_name":"Cytotoxicity","score":0.5616074204444885},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4823557734489441},{"id":"https://openalex.org/keywords/mean-squared-error","display_name":"Mean squared error","score":0.46553388237953186},{"id":"https://openalex.org/keywords/quantitative-structure\u2013activity-relationship","display_name":"Quantitative structure\u2013activity relationship","score":0.462777704000473},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.45820334553718567},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.44200533628463745},{"id":"https://openalex.org/keywords/principal-component-analysis","display_name":"Principal component analysis","score":0.41627538204193115},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.3999221920967102},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.2916423976421356},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.2510456442832947},{"id":"https://openalex.org/keywords/stereochemistry","display_name":"Stereochemistry","score":0.21774446964263916},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.1068926751613617},{"id":"https://openalex.org/keywords/in-vitro","display_name":"In vitro","score":0.09753495454788208}],"concepts":[{"id":"https://openalex.org/C154317977","wikidata":"https://www.wikidata.org/wiki/Q376266","display_name":"Cytotoxic T cell","level":3,"score":0.5620497465133667},{"id":"https://openalex.org/C109316439","wikidata":"https://www.wikidata.org/wiki/Q246181","display_name":"Cytotoxicity","level":3,"score":0.5616074204444885},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4823557734489441},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.46553388237953186},{"id":"https://openalex.org/C164126121","wikidata":"https://www.wikidata.org/wiki/Q766383","display_name":"Quantitative structure\u2013activity relationship","level":2,"score":0.462777704000473},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.45820334553718567},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.44200533628463745},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.41627538204193115},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.3999221920967102},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2916423976421356},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2510456442832947},{"id":"https://openalex.org/C71240020","wikidata":"https://www.wikidata.org/wiki/Q186011","display_name":"Stereochemistry","level":1,"score":0.21774446964263916},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.1068926751613617},{"id":"https://openalex.org/C202751555","wikidata":"https://www.wikidata.org/wiki/Q221681","display_name":"In vitro","level":2,"score":0.09753495454788208}],"mesh":[{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004354","descriptor_name":"Drug Screening Assays, Antitumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D004354","descriptor_name":"Drug Screening Assays, Antitumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D004354","descriptor_name":"Drug Screening Assays, Antitumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D004354","descriptor_name":"Drug Screening Assays, Antitumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D045744","descriptor_name":"Cell Line, Tumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D045744","descriptor_name":"Cell Line, Tumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D045744","descriptor_name":"Cell Line, Tumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D045744","descriptor_name":"Cell Line, Tumor","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":3,"locations":[{"id":"doi:10.1021/ci800097k","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci800097k","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:18588283","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/18588283","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:2561991","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2561991","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:2561991","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2561991","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"},"sustainable_development_goals":[{"display_name":"Good health and well-being","score":0.6499999761581421,"id":"https://metadata.un.org/sdg/3"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321026","display_name":"Ministry of Earth Sciences","ror":"https://ror.org/013cf5k59"},{"id":"https://openalex.org/F4320322724","display_name":"Ministry of Education, India","ror":"https://ror.org/048xjjh50"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1640748652","https://openalex.org/W1970651561","https://openalex.org/W1973470802","https://openalex.org/W1975618638","https://openalex.org/W2005723242","https://openalex.org/W2049331434","https://openalex.org/W2051810242","https://openalex.org/W2066376270","https://openalex.org/W2080799570","https://openalex.org/W2095028909","https://openalex.org/W2117692612","https://openalex.org/W2125877278","https://openalex.org/W2146431863","https://openalex.org/W2463436485","https://openalex.org/W2797583072","https://openalex.org/W3175318380"],"related_works":["https://openalex.org/W2024203776","https://openalex.org/W1892306976","https://openalex.org/W2155804408","https://openalex.org/W1997573797","https://openalex.org/W2029611001","https://openalex.org/W2166496668","https://openalex.org/W2072827207","https://openalex.org/W2008095939","https://openalex.org/W2036648450","https://openalex.org/W1999796036"],"abstract_inverted_index":{"Elimination":[0],"of":[1,10,18,25,41,55,63,65,78,99,119,129,132,151],"cytotoxic":[2,53,201],"compounds":[3],"in":[4,124,148,203],"the":[5,16,23,42,51,61,84,97,100,120,127,130,152,164,181],"early":[6],"and":[7,20,36,176,183,205,212],"later":[8],"stages":[9],"drug":[11],"discovery":[12],"can":[13,114,159,195],"help":[14],"reduce":[15],"costs":[17],"research":[19],"development.":[21],"Through":[22],"application":[24],"principal":[26],"components":[27],"analysis":[28],"(PCA),":[29],"we":[30,105,140],"were":[31],"able":[32],"to":[33,50,60,83,92,162,198],"data":[34],"mine":[35],"prove":[37],"that":[38,113],"approximately":[39],"89%":[40],"total":[43],"log":[44,102,134,166,186],"GI":[45,103,135,167,187],"50":[46,136,188],"variance":[47],"is":[48],"due":[49],"nonspecific":[52,94],"nature":[54],"substances.":[56],"Furthermore,":[57],"PCA":[58],"led":[59],"identification":[62],"groups":[64],"structurally":[66],"unrelated":[67],"substances":[68,80,121],"showing":[69],"very":[70],"specific":[71],"toxicity":[72],"profiles,":[73],"such":[74],"as":[75,122],"a":[76,107,143,177],"set":[77],"45":[79],"toxic":[81],"only":[82],"Leukemia_SR":[85],"cancer":[86,156],"cell":[87,157],"line.":[88],"In":[89],"an":[90],"effort":[91],"predict":[93,163],"cytotoxicity":[95],"on":[96,126],"basis":[98,128],"mean":[101,133,165,185],"50,":[104],"created":[106],"decision":[108],"tree":[109],"using":[110,146],"MACCS":[111],"keys":[112],"correctly":[115],"classify":[116],"over":[117],"83%":[118],"cytotoxic/noncytotoxic":[123],"silico,":[125],"cutoff":[131],"=":[137,174,190],"-5.0.":[138],"Finally,":[139],"have":[141],"established":[142],"linear":[144],"model":[145,170],"least-squares":[147],"which":[149],"nine":[150],"59":[153],"available":[154],"NCI60":[155],"lines":[158],"be":[160,196],"used":[161],"50.":[168],"The":[169],"has":[171],"R":[172],"(2)":[173],"0.99":[175],"root-mean-square":[178],"deviation":[179],"between":[180],"observed":[182],"calculated":[184],"(RMSE)":[189],"0.09.":[191],"Our":[192],"predictive":[193],"models":[194],"applied":[197],"flag":[199],"generally":[200],"molecules":[202],"virtual":[204],"real":[206],"chemical":[207],"libraries,":[208],"thus":[209],"saving":[210],"time":[211],"effort.":[213]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2026-06-17T06:14:20.161405","created_date":"2025-10-10T00:00:00"}
