{"id":"https://openalex.org/W1990566000","doi":"https://doi.org/10.1021/ci5005652","title":"Improved Prediction of CYP-Mediated Metabolism with Chemical Fingerprints","display_name":"Improved Prediction of CYP-Mediated Metabolism with Chemical Fingerprints","publication_year":2015,"publication_date":"2015-04-14","ids":{"openalex":"https://openalex.org/W1990566000","doi":"https://doi.org/10.1021/ci5005652","mag":"1990566000","pmid":"https://pubmed.ncbi.nlm.nih.gov/25871613"},"language":"en","primary_location":{"id":"doi:10.1021/ci5005652","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci5005652","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007493323","display_name":"Jed Zaretzki","orcid":null},"institutions":[{"id":"https://openalex.org/I204465549","display_name":"Washington University in St. Louis","ror":"https://ror.org/01yc7t268","country_code":"US","type":"education","lineage":["https://openalex.org/I204465549"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jed Zaretzki","raw_affiliation_strings":["Department of Pathology and\rImmunology, Washington University School of Medicine, Campus Box\r1097 Whitaker Hall, St. Louis, Missouri 63130, United States","Department of Pathology and Immunology, Washington University School of Medicine, Campus Box 1097 Whitaker Hall, St. Louis, Missouri 63130, United States"],"affiliations":[{"raw_affiliation_string":"Department of Pathology and\rImmunology, Washington University School of Medicine, Campus Box\r1097 Whitaker Hall, St. Louis, Missouri 63130, United States","institution_ids":["https://openalex.org/I204465549"]},{"raw_affiliation_string":"Department of Pathology and Immunology, Washington University School of Medicine, Campus Box 1097 Whitaker Hall, St. Louis, Missouri 63130, United States","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079316337","display_name":"Kevin M. Boehm","orcid":"https://orcid.org/0000-0002-1703-5301"},"institutions":[{"id":"https://openalex.org/I204465549","display_name":"Washington University in St. Louis","ror":"https://ror.org/01yc7t268","country_code":"US","type":"education","lineage":["https://openalex.org/I204465549"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kevin M. Boehm","raw_affiliation_strings":["Department of Pathology and\rImmunology, Washington University School of Medicine, Campus Box\r1097 Whitaker Hall, St. Louis, Missouri 63130, United States","Department of Pathology and Immunology, Washington University School of Medicine, Campus Box 1097 Whitaker Hall, St. Louis, Missouri 63130, United States"],"affiliations":[{"raw_affiliation_string":"Department of Pathology and\rImmunology, Washington University School of Medicine, Campus Box\r1097 Whitaker Hall, St. Louis, Missouri 63130, United States","institution_ids":["https://openalex.org/I204465549"]},{"raw_affiliation_string":"Department of Pathology and Immunology, Washington University School of Medicine, Campus Box 1097 Whitaker Hall, St. Louis, Missouri 63130, United States","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086610385","display_name":"S. Joshua Swamidass","orcid":"https://orcid.org/0000-0003-2191-0778"},"institutions":[{"id":"https://openalex.org/I204465549","display_name":"Washington University in St. Louis","ror":"https://ror.org/01yc7t268","country_code":"US","type":"education","lineage":["https://openalex.org/I204465549"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"S. Joshua Swamidass","raw_affiliation_strings":["Department of Pathology and\rImmunology, Washington University School of Medicine, Campus Box\r1097 Whitaker Hall, St. Louis, Missouri 63130, United States","Department of Pathology and Immunology, Washington University School of Medicine, Campus Box 1097 Whitaker Hall, St. Louis, Missouri 63130, United States"],"affiliations":[{"raw_affiliation_string":"Department of Pathology and\rImmunology, Washington University School of Medicine, Campus Box\r1097 Whitaker Hall, St. Louis, Missouri 63130, United States","institution_ids":["https://openalex.org/I204465549"]},{"raw_affiliation_string":"Department of Pathology and Immunology, Washington University School of Medicine, Campus Box 1097 Whitaker Hall, St. Louis, Missouri 63130, United States","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5007493323"],"corresponding_institution_ids":["https://openalex.org/I204465549"],"apc_list":null,"apc_paid":null,"fwci":2.8041,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.90737446,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"55","issue":"5","first_page":"972","last_page":"982"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10375","display_name":"Pharmacogenetics and Drug Metabolism","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/3004","display_name":"Pharmacology"},"field":{"id":"https://openalex.org/fields/30","display_name":"Pharmacology, Toxicology and Pharmaceutics"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fingerprint","display_name":"Fingerprint (computing)","score":0.7387012839317322},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4991915225982666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43304935097694397},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42643263936042786},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.35634034872055054},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33135294914245605},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.15919992327690125}],"concepts":[{"id":"https://openalex.org/C2777826928","wikidata":"https://www.wikidata.org/wiki/Q3745713","display_name":"Fingerprint (computing)","level":2,"score":0.7387012839317322},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4991915225982666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43304935097694397},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42643263936042786},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.35634034872055054},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33135294914245605},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.15919992327690125}],"mesh":[{"descriptor_ui":"D001665","descriptor_name":"Binding Sites","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001665","descriptor_name":"Binding Sites","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001665","descriptor_name":"Binding Sites","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003577","descriptor_name":"Cytochrome P-450 Enzyme System","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D003577","descriptor_name":"Cytochrome P-450 Enzyme System","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D003577","descriptor_name":"Cytochrome P-450 Enzyme System","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D003577","descriptor_name":"Cytochrome P-450 Enzyme System","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D003577","descriptor_name":"Cytochrome P-450 Enzyme System","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D003577","descriptor_name":"Cytochrome P-450 Enzyme System","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D007527","descriptor_name":"Isoenzymes","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D007527","descriptor_name":"Isoenzymes","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D007527","descriptor_name":"Isoenzymes","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D007527","descriptor_name":"Isoenzymes","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D007527","descriptor_name":"Isoenzymes","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D007527","descriptor_name":"Isoenzymes","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D015203","descriptor_name":"Reproducibility of Results","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015203","descriptor_name":"Reproducibility of Results","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015203","descriptor_name":"Reproducibility of Results","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020407","descriptor_name":"Internet","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020407","descriptor_name":"Internet","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020407","descriptor_name":"Internet","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/ci5005652","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci5005652","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:25871613","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/25871613","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1972390620","https://openalex.org/W1974254541","https://openalex.org/W1984648567","https://openalex.org/W1988037271","https://openalex.org/W1997039157","https://openalex.org/W2011805684","https://openalex.org/W2024469207","https://openalex.org/W2031017656","https://openalex.org/W2032271067","https://openalex.org/W2035091931","https://openalex.org/W2038702914","https://openalex.org/W2044834685","https://openalex.org/W2081301924","https://openalex.org/W2090505208","https://openalex.org/W2103965340","https://openalex.org/W2104925243","https://openalex.org/W2126829482","https://openalex.org/W2128302372","https://openalex.org/W2200810672"],"related_works":["https://openalex.org/W2364411142","https://openalex.org/W2033914206","https://openalex.org/W2146076056","https://openalex.org/W2163831990","https://openalex.org/W3003836766","https://openalex.org/W2046077695","https://openalex.org/W2389470892","https://openalex.org/W2997969508","https://openalex.org/W4309838615","https://openalex.org/W4293863368"],"abstract_inverted_index":{"Molecule":[0],"and":[1,109,122,137,177,197,247,255,260,302,305],"atom":[2,304],"fingerprints,":[3,8,277],"similar":[4],"to":[5,61,70,142],"path-based":[6],"Daylight":[7],"can":[9,68],"substantially":[10],"improve":[11],"the":[12,34,75,83,155,173,182,232,235,274],"accuracy":[13,84],"of":[14,36,41,64,77,85,95,102,140,165,170,225,297,311],"P450":[15,86,92],"site-of-metabolism":[16,87],"prediction":[17,88],"models.":[18,54,72,190],"Only":[19],"two":[20,175],"chemical":[21,80],"fingerprints":[22,49,60,81,207,215,238,280],"have":[23],"been":[24],"used":[25],"in":[26,172,200,263,295],"metabolism":[27,42,65,96,171,298,312],"prediction,":[28],"so":[29],"little":[30],"is":[31,45],"known":[32],"about":[33],"importance":[35],"fingerprint":[37,148,189],"parameters":[38],"on":[39,82,90,154,160,243],"site":[40,63,94,169,296,310],"predictions.":[43],"It":[44],"possible":[46],"that":[47,126,289],"different":[48,113,214,217,266,279,284],"might":[50],"yield":[51],"more":[52,144,185,203,222],"accurate":[53,186],"Here,":[55],"we":[56,105],"study":[57,106],"if":[58],"tuning":[59],"specific":[62,79],"data":[66,97,158],"sets":[67],"lead":[69],"improved":[71],"We":[73],"measure":[74],"impact":[76],"484":[78],"models":[89,149,313],"nine":[91],"isoform":[93],"sets.":[98],"Using":[99],"a":[100,124,168,195,221,258],"range":[101],"search":[103],"depths,":[104],"path,":[107],"circular,":[108],"subgraph":[110],"fingerprints.":[111,307],"Two":[112],"labelings,":[114],"also,":[115],"are":[116,252,291,318],"considered,":[117],"both":[118],"standard":[119],"SMILES":[120],"labels":[121],"also":[123],"labeling":[125],"marks":[127],"ring":[128],"bonds":[129],"differently":[130],"than":[131,187],"nonring":[132],"bonds,":[133],"enabling":[134],"ortho,":[135],"para,":[136],"meta":[138],"positioning":[139],"substituents":[141],"be":[143],"clearly":[145],"encoded.":[146],"Optimal":[147],"chosen":[150],"by":[151,300,315],"cross-validation":[152,210],"performance":[153],"full":[156],"training":[157],"are,":[159],"average,":[161,244],"3.8%":[162],"(Top-2;":[163],"percent":[164],"molecules":[166],"with":[167,278],"top":[174,236,275],"predictions)":[176],"1.4%":[178],"(AUC;":[179],"area":[180],"under":[181],"ROC":[183],"curve)":[184],"base":[188],"These":[191,250,286],"gains":[192,251,293],"represent,":[193,256],"respectively,":[194,257],"25.6%":[196],"16.7%":[198],"reduction":[199,262],"error.":[201,227,264],"A":[202],"rigorous":[204],"assessment":[205],"selects":[206],"within":[208],"each":[209],"fold,":[211],"sometimes":[212],"selecting":[213],"for":[216,283,320],"folds,":[218],"but":[219],"yielding":[220],"reliable":[223],"estimate":[224],"generalization":[226],"In":[228],"this":[229,316],"assessment,":[230],"averaging":[231],"scores":[233],"from":[234],"few":[237],"yields":[239],"performances":[240],"improvements":[241],"of,":[242],"3.0%":[245],"(Top-2)":[246],"0.7%":[248],"(AUC).":[249],"statistically":[253],"significant":[254],"20.1%":[259],"8.8%":[261],"Between":[265],"isoforms,":[267],"not":[268],"many":[269],"consistencies":[270],"were":[271],"observed":[272],"among":[273],"performing":[276],"working":[281],"best":[282],"isoforms.":[285],"results":[287],"suggest":[288],"there":[290],"important":[292],"achievable":[294],"modeling":[299],"including":[301],"optimizing":[303],"molecule":[306],"The":[308],"optimal":[309],"determined":[314],"approach":[317],"available":[319],"use":[321],"at":[322],"http://swami.wustl.edu/.":[323]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
