{"id":"https://openalex.org/W2141738404","doi":"https://doi.org/10.1186/1758-2946-5-s1-p33","title":"Reliable estimation of externally validated prediction errors for QSAR models","display_name":"Reliable estimation of externally validated prediction errors for QSAR models","publication_year":2013,"publication_date":"2013-03-01","ids":{"openalex":"https://openalex.org/W2141738404","doi":"https://doi.org/10.1186/1758-2946-5-s1-p33","mag":"2141738404"},"language":"en","primary_location":{"id":"doi:10.1186/1758-2946-5-s1-p33","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1758-2946-5-s1-p33","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-5-S1-P33","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-5-S1-P33","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063281959","display_name":"D\u00e9sir\u00e9e Baumann","orcid":null},"institutions":[{"id":"https://openalex.org/I94509681","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66","country_code":"DE","type":"education","lineage":["https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"D\u00e9sir\u00e9e Baumann","raw_affiliation_strings":["Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Beethovenstra\u00dfe 55, D-38106, Braunschweig, Germany","Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Braunschweig, Germany"],"affiliations":[{"raw_affiliation_string":"Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Beethovenstra\u00dfe 55, D-38106, Braunschweig, Germany","institution_ids":["https://openalex.org/I94509681"]},{"raw_affiliation_string":"Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Braunschweig, Germany","institution_ids":["https://openalex.org/I94509681"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027269400","display_name":"Knut Baumann","orcid":"https://orcid.org/0000-0001-9459-0045"},"institutions":[{"id":"https://openalex.org/I94509681","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66","country_code":"DE","type":"education","lineage":["https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Knut Baumann","raw_affiliation_strings":["Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Beethovenstra\u00dfe 55, D-38106, Braunschweig, Germany","Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Braunschweig, Germany"],"affiliations":[{"raw_affiliation_string":"Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Beethovenstra\u00dfe 55, D-38106, Braunschweig, Germany","institution_ids":["https://openalex.org/I94509681"]},{"raw_affiliation_string":"Institut f\u00fcr Medizinische und Pharmazeutische Chemie, Technische Universit\u00e4t Braunschweig, Braunschweig, Germany","institution_ids":["https://openalex.org/I94509681"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5063281959"],"corresponding_institution_ids":["https://openalex.org/I94509681"],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582},"fwci":0.0,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.11705526,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"5","issue":"S1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9580000042915344,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cross-validation","display_name":"Cross-validation","score":0.7966583967208862},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7045823335647583},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6889157891273499},{"id":"https://openalex.org/keywords/test-set","display_name":"Test set","score":0.6456779837608337},{"id":"https://openalex.org/keywords/model-selection","display_name":"Model selection","score":0.6056985855102539},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5957992076873779},{"id":"https://openalex.org/keywords/data-validation","display_name":"Data validation","score":0.5803476572036743},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5634582042694092},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.5345717072486877},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.5249124765396118},{"id":"https://openalex.org/keywords/model-validation","display_name":"Model validation","score":0.515579879283905},{"id":"https://openalex.org/keywords/test-data","display_name":"Test data","score":0.5085350275039673},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.4283655881881714},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3927334249019623},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3614664673805237},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.08719825744628906}],"concepts":[{"id":"https://openalex.org/C27181475","wikidata":"https://www.wikidata.org/wiki/Q541014","display_name":"Cross-validation","level":2,"score":0.7966583967208862},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7045823335647583},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6889157891273499},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.6456779837608337},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.6056985855102539},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5957992076873779},{"id":"https://openalex.org/C92446256","wikidata":"https://www.wikidata.org/wiki/Q3306762","display_name":"Data validation","level":2,"score":0.5803476572036743},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5634582042694092},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.5345717072486877},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.5249124765396118},{"id":"https://openalex.org/C3019813237","wikidata":"https://www.wikidata.org/wiki/Q65089264","display_name":"Model validation","level":2,"score":0.515579879283905},{"id":"https://openalex.org/C16910744","wikidata":"https://www.wikidata.org/wiki/Q7705759","display_name":"Test data","level":2,"score":0.5085350275039673},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.4283655881881714},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3927334249019623},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3614664673805237},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.08719825744628906},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/1758-2946-5-s1-p33","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1758-2946-5-s1-p33","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-5-S1-P33","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},{"id":"pmh:oai:europepmc.org:2605454","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3606159","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1758-2946-5-s1-p33","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1758-2946-5-s1-p33","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-5-S1-P33","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.47999998927116394,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2141738404.pdf","grobid_xml":"https://content.openalex.org/works/W2141738404.grobid-xml"},"referenced_works_count":2,"referenced_works":["https://openalex.org/W2023130417","https://openalex.org/W2090790364"],"related_works":["https://openalex.org/W816105089","https://openalex.org/W2100523380","https://openalex.org/W4254524906","https://openalex.org/W3011444647","https://openalex.org/W3048572280","https://openalex.org/W2095987352","https://openalex.org/W2044298310","https://openalex.org/W4249858832","https://openalex.org/W3207949591","https://openalex.org/W3035752049"],"abstract_inverted_index":{"In":[0,202],"most":[1],"cases":[2],"of":[3,30,36,44,63,197,224,271,281,287],"QSAR":[4],"modelling":[5,40],"the":[6,37,61,66,89,92,130,138,153,185,203,221,238,282,301],"final":[7],"model":[8,51,77,82,188,210,258],"used":[9,235],"to":[10,20,71,159,183,215,236,253,299,307],"make":[11],"predictions,":[12],"is":[13,53,85,125,158,190,207,248,265],"not":[14,74,172],"known":[15],"a":[16,24,55,86,109,120,176,309],"priori":[17],"but":[18,79],"has":[19,70],"be":[21,72,98,160,173,181,292],"selected":[22,240],"in":[23,57,88,162,220,305],"data":[25,68,95,111,123,132,140,154,166,228],"driven":[26],"fashion":[27],"(e.g.":[28],"selection":[29,35,189,211],"principal":[31],"components,":[32],"variable":[33,279],"selection,":[34],"best":[38],"mathematical":[39],"technique).":[41],"Reliable":[42],"estimation":[43],"externally":[45],"validated":[46],"prediction":[47,255,283],"errors":[48,256],"under":[49,257],"this":[50,244],"uncertainty":[52],"still":[54,84],"challenge":[56],"chemoinformatics.":[58],"To":[59],"fulfil":[60],"standards":[62],"external":[64],"validation,":[65],"test":[67,94,110,122,131,142,227,302],"set":[69,96,112,124,126,145,268,303],"independent":[73,93],"only":[75],"from":[76,81],"building":[78],"also":[80,191],"selection.\r\n\r\nThere":[83],"controversy":[87],"literature":[90],"how":[91,101,262,298],"should":[97,104],"chosen":[99],"and":[100,128,143,289,294],"large":[102],"it":[103,157,273],"be.":[105],"For":[106],"setting":[107],"aside":[108,127],"there":[113],"are":[114,133,199,230,234,296],"basically":[115],"two":[116,195],"different":[117,226],"options:":[118],"1)":[119],"single":[121],"2)":[129],"generated":[134,231],"by":[135,193],"repeatedly":[136,232],"partitioning":[137],"available":[139],"into":[141],"training":[144],"partitions":[146],"-":[147],"i.e.":[148],"cross-validation.":[149],"Since":[150],"cross-validation":[151,169,177,194,198,206,225,247,264],"uses":[152],"more":[155],"efficiently,":[156],"preferred":[161],"particular":[163],"for":[164,209,250],"small":[165],"sets.\r\n\r\nThe":[167],"aforementioned":[168],"step":[170,178],"must":[171],"confused":[174],"with":[175],"that":[179,233],"might":[180],"necessary":[182,200],"select":[184],"model!":[186],"If":[187],"done":[192],"loops":[196],"[1].":[201],"inner":[204],"loop,":[205],"employed":[208],"[2]":[212],"(also":[213],"referred":[214],"as":[216],"internal":[217],"validation)":[218],"while":[219],"outer":[222],"loop":[223],"sets":[229],"assess":[237],"readily":[239],"models":[241],"(external":[242],"validation).\r\n\r\nIn":[243],"contribution":[245],"double":[246,263],"evaluated":[249],"its":[251],"ability":[252],"estimate":[254],"uncertainty.":[259],"Depending":[260],"on":[261],"parameterized":[266],"(test":[267],"size,":[269],"number":[270],"repetitions),":[272],"either":[274],"yields":[275],"biased":[276],"or":[277],"highly":[278],"estimates":[280],"error.":[284],"The":[285],"sources":[286],"bias":[288],"variability":[290],"will":[291],"highlighted":[293],"recommendations":[295],"provided":[297],"determine":[300],"size":[304],"order":[306],"obtain":[308],"favourable":[310],"bias-variability":[311],"trade-off.":[312]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
