{"id":"https://openalex.org/W2810048461","doi":"https://doi.org/10.1021/acs.jcim.8b00114","title":"General Approach to Estimate Error Bars for Quantitative Structure\u2013Activity Relationship Predictions of Molecular Activity","display_name":"General Approach to Estimate Error Bars for Quantitative Structure\u2013Activity Relationship Predictions of Molecular Activity","publication_year":2018,"publication_date":"2018-06-27","ids":{"openalex":"https://openalex.org/W2810048461","doi":"https://doi.org/10.1021/acs.jcim.8b00114","mag":"2810048461","pmid":"https://pubmed.ncbi.nlm.nih.gov/29949366"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.8b00114","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.8b00114","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100738736","display_name":"Ruifeng Liu","orcid":"https://orcid.org/0000-0001-7582-9217"},"institutions":[{"id":"https://openalex.org/I2802581893","display_name":"United States Army Medical Research and Development Command","ror":"https://ror.org/03cd02q50","country_code":"US","type":"facility","lineage":["https://openalex.org/I106965489","https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I2802581893"]},{"id":"https://openalex.org/I2800986571","display_name":"Telemedicine & Advanced Technology Research Center","ror":"https://ror.org/014pvr265","country_code":"US","type":"funder","lineage":["https://openalex.org/I106965489","https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I2800986571","https://openalex.org/I2802581893"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ruifeng Liu","raw_affiliation_strings":["Department of Defense Biotechnology High Performance Computing Software Applications Institute, Telemedicine and Advanced Technology Research Center, U.S. Army Medical Research and Materiel Command, Fort Detrick, Maryland 21702, United States"],"affiliations":[{"raw_affiliation_string":"Department of Defense Biotechnology High Performance Computing Software Applications Institute, Telemedicine and Advanced Technology Research Center, U.S. Army Medical Research and Materiel Command, Fort Detrick, Maryland 21702, United States","institution_ids":["https://openalex.org/I2802581893","https://openalex.org/I2800986571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080632719","display_name":"Kyle Glover","orcid":null},"institutions":[{"id":"https://openalex.org/I1331871522","display_name":"Defense Threat Reduction Agency","ror":"https://ror.org/04tz64554","country_code":"US","type":"government","lineage":["https://openalex.org/I1296703163","https://openalex.org/I1330347796","https://openalex.org/I1330347796","https://openalex.org/I1331871522"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kyle P. Glover","raw_affiliation_strings":["Defense Threat Reduction Agency, Aberdeen Proving Ground, Maryland 21010, United States"],"affiliations":[{"raw_affiliation_string":"Defense Threat Reduction Agency, Aberdeen Proving Ground, Maryland 21010, United States","institution_ids":["https://openalex.org/I1331871522"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004092384","display_name":"Michael G. Feasel","orcid":"https://orcid.org/0000-0001-7029-2764"},"institutions":[{"id":"https://openalex.org/I4387153805","display_name":"U.S. Army Combat Capabilities Development Command Chemical Biological Center","ror":"https://ror.org/022j0mn33","country_code":null,"type":"government","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I2802705668","https://openalex.org/I4210154437","https://openalex.org/I4387153805"]},{"id":"https://openalex.org/I4210088792","display_name":"United States Army","ror":"https://ror.org/00afsp483","country_code":"US","type":"funder","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I4210088792"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael G. Feasel","raw_affiliation_strings":["U.S. Army\u2014Edgewood Chemical Biological Center, Operational Toxicology, Aberdeen Proving Ground, Maryland 21010, United States"],"affiliations":[{"raw_affiliation_string":"U.S. Army\u2014Edgewood Chemical Biological Center, Operational Toxicology, Aberdeen Proving Ground, Maryland 21010, United States","institution_ids":["https://openalex.org/I4210088792","https://openalex.org/I4387153805"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030271505","display_name":"Anders Wallqvist","orcid":"https://orcid.org/0000-0002-9775-7469"},"institutions":[{"id":"https://openalex.org/I2800986571","display_name":"Telemedicine & Advanced Technology Research Center","ror":"https://ror.org/014pvr265","country_code":"US","type":"funder","lineage":["https://openalex.org/I106965489","https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I2800986571","https://openalex.org/I2802581893"]},{"id":"https://openalex.org/I2802581893","display_name":"United States Army Medical Research and Development Command","ror":"https://ror.org/03cd02q50","country_code":"US","type":"facility","lineage":["https://openalex.org/I106965489","https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I2802581893"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Anders Wallqvist","raw_affiliation_strings":["Department of Defense Biotechnology High Performance Computing Software Applications Institute, Telemedicine and Advanced Technology Research Center, U.S. Army Medical Research and Materiel Command, Fort Detrick, Maryland 21702, United States"],"affiliations":[{"raw_affiliation_string":"Department of Defense Biotechnology High Performance Computing Software Applications Institute, Telemedicine and Advanced Technology Research Center, U.S. Army Medical Research and Materiel Command, Fort Detrick, Maryland 21702, United States","institution_ids":["https://openalex.org/I2802581893","https://openalex.org/I2800986571"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5030271505","https://openalex.org/A5100738736"],"corresponding_institution_ids":["https://openalex.org/I2800986571","https://openalex.org/I2802581893"],"apc_list":null,"apc_paid":null,"fwci":3.8368,"has_fulltext":false,"cited_by_count":44,"citation_normalized_percentile":{"value":0.94497712,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"58","issue":"8","first_page":"1561","last_page":"1575"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9610999822616577,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9567999839782715,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/error-bar","display_name":"Error bar","score":0.5480974316596985},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.3838244378566742},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.36104416847229004},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3309820890426636},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.3010573387145996},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.30007636547088623},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.17590606212615967}],"concepts":[{"id":"https://openalex.org/C170797541","wikidata":"https://www.wikidata.org/wiki/Q452399","display_name":"Error bar","level":2,"score":0.5480974316596985},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3838244378566742},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.36104416847229004},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3309820890426636},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.3010573387145996},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.30007636547088623},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.17590606212615967}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D035501","descriptor_name":"Uncertainty","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D035501","descriptor_name":"Uncertainty","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D035501","descriptor_name":"Uncertainty","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000494","qualifier_name":"pharmacology","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000494","qualifier_name":"pharmacology","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000494","qualifier_name":"pharmacology","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000633","qualifier_name":"toxicity","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000633","qualifier_name":"toxicity","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000633","qualifier_name":"toxicity","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D054852","descriptor_name":"Small Molecule Libraries","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.8b00114","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.8b00114","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:29949366","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/29949366","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5851990620","display_name":null,"funder_award_id":"CBCall14-CBS-05-2-0007","funder_id":"https://openalex.org/F4320332186","funder_display_name":"Defense Threat Reduction Agency"}],"funders":[{"id":"https://openalex.org/F4320332186","display_name":"Defense Threat Reduction Agency","ror":"https://ror.org/04tz64554"},{"id":"https://openalex.org/F4320338280","display_name":"Medical Research and Materiel Command","ror":"https://ror.org/03cd02q50"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1963602805","https://openalex.org/W1964114566","https://openalex.org/W1965106906","https://openalex.org/W1970334426","https://openalex.org/W1988037271","https://openalex.org/W1988848470","https://openalex.org/W1989485111","https://openalex.org/W1990399577","https://openalex.org/W1993492933","https://openalex.org/W2003032055","https://openalex.org/W2013894207","https://openalex.org/W2015931265","https://openalex.org/W2017398555","https://openalex.org/W2025556769","https://openalex.org/W2042278642","https://openalex.org/W2048611698","https://openalex.org/W2054111413","https://openalex.org/W2057910058","https://openalex.org/W2079444823","https://openalex.org/W2079699273","https://openalex.org/W2085890279","https://openalex.org/W2089578131","https://openalex.org/W2090999676","https://openalex.org/W2097793132","https://openalex.org/W2099538400","https://openalex.org/W2099568216","https://openalex.org/W2129893339","https://openalex.org/W2133679578","https://openalex.org/W2136701534","https://openalex.org/W2174230067","https://openalex.org/W2176009755","https://openalex.org/W2201106676","https://openalex.org/W2290847742","https://openalex.org/W2294516783","https://openalex.org/W2396527967","https://openalex.org/W2407586185","https://openalex.org/W2549144853","https://openalex.org/W3100157108","https://openalex.org/W4238793347"],"related_works":["https://openalex.org/W1979597421","https://openalex.org/W2007980826","https://openalex.org/W4245490552","https://openalex.org/W2061531152","https://openalex.org/W3002753104","https://openalex.org/W2077600819","https://openalex.org/W1587224694","https://openalex.org/W2042127053","https://openalex.org/W2142036596","https://openalex.org/W4238204885"],"abstract_inverted_index":{"Key":[0],"requirements":[1],"for":[2,145,208,269,277,306,335],"quantitative":[3],"structure-activity":[4],"relationship":[5],"(QSAR)":[6],"models":[7,82,287],"to":[8,104,128,137,221,241,246,292,329],"gain":[9],"acceptance":[10],"by":[11,77],"regulatory":[12],"authorities":[13],"include":[14],"a":[15,60,86,111,147,156,178,296,315,321],"defined":[16,52],"domain":[17],"of":[18,24,55,75,80,97,109,165,188,213,236,253,280],"applicability":[19],"(DA)":[20],"and":[21,27,62,89,191,217,250,288],"appropriate":[22],"measures":[23],"goodness-of-fit,":[25],"robustness,":[26],"predictivity.":[28],"Hence,":[29],"many":[30],"DA":[31,87,149,160],"metrics":[32],"have":[33,70],"been":[34],"developed":[35],"over":[36],"the":[37,56,73,95,107,118,129,135,143,163,205,214,223,227,234,243,251,261,264,278],"past":[38],"two":[39],"decades.":[40],"The":[41,257],"most":[42,50],"intuitive":[43],"are":[44,49],"perhaps":[45],"distance-to-model":[46,92],"metrics,":[47],"which":[48,169],"commonly":[51],"in":[53,177],"terms":[54],"mean":[57,244,283],"distance":[58,127,136,245],"between":[59],"molecule":[61,113,332],"its":[63,126],"k":[64],"nearest":[65],"training":[66,130,138,179,248],"samples.":[67],"Detailed":[68],"evaluations":[69],"shown":[71],"that":[72,106,134,200,260,274,324],"variance":[74,99,252],"predictions":[76],"an":[78,302],"ensemble":[79,98],"QSAR":[81,224,297],"may":[83,140],"serve":[84,141],"as":[85,142],"metric":[88,100,161],"can":[90,325],"outperform":[91],"metrics.":[93],"Intriguingly,":[94],"performance":[96],"has":[101],"led":[102],"researchers":[103],"conclude":[105],"error":[108,207,266,285],"predicting":[110],"new":[112,157],"does":[114,311],"not":[115,293,312],"depend":[116,313],"on":[117,125,314],"input":[119],"descriptors":[120,219],"or":[121],"machine-learning":[122,215,317,337],"methods":[123,216],"but":[124,299],"molecules.":[131],"This":[132],"implies":[133],"samples":[139],"basis":[144],"developing":[146],"high-performance":[148],"metric.":[150],"In":[151],"this":[152],"article,":[153],"we":[154,198,232],"introduce":[155],"Tanimoto":[158],"distance-based":[159],"called":[162],"sum":[164],"distance-weighted":[166],"contributions":[167,173],"(SDC),":[168],"takes":[170],"into":[171],"account":[172],"from":[174],"all":[175,209],"molecules":[176],"set.":[180],"Using":[181,226],"four":[182,192],"acute":[183,228],"chemical":[184],"toxicity":[185,229],"data":[186,196,210,230],"sets":[187,211],"varying":[189],"sizes":[190],"other":[193],"molecular":[194,218],"property":[195],"sets,":[197,231],"demonstrate":[199,273],"SDC":[201,275,310],"correlates":[202],"well":[203],"with":[204,239,263],"prediction":[206,237,265,298,333],"regardless":[212],"used":[220,328],"build":[222],"models.":[225],"compared":[233],"distribution":[235],"errors":[238,334],"respect":[240],"SDC,":[242],"k-nearest":[247],"samples,":[249],"random":[254],"forest":[255],"predictions.":[256],"results":[258],"showed":[259],"correlation":[262],"was":[267],"highest":[268],"SDC.":[270],"We":[271],"also":[272,300],"allows":[276],"development":[279],"robust":[281],"root":[282],"squared":[284],"(RMSE)":[286],"makes":[289],"it":[290,319],"possible":[291],"only":[294],"give":[295],"provide":[301],"individual":[303,331],"RMSE":[304],"estimate":[305,330],"each":[307],"molecule.":[308],"Because":[309],"specific":[316],"method,":[318],"represents":[320],"canonical":[322],"measure":[323],"be":[326],"widely":[327],"any":[336],"method.":[338]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
