{"id":"https://openalex.org/W1990919689","doi":"https://doi.org/10.1021/ci500264r","title":"Are Bigger Data Sets Better for Machine Learning? Fusing Single-Point and Dual-Event Dose Response Data for Mycobacterium tuberculosis","display_name":"Are Bigger Data Sets Better for Machine Learning? Fusing Single-Point and Dual-Event Dose Response Data for Mycobacterium tuberculosis","publication_year":2014,"publication_date":"2014-07-17","ids":{"openalex":"https://openalex.org/W1990919689","doi":"https://doi.org/10.1021/ci500264r","mag":"1990919689","pmid":"https://pubmed.ncbi.nlm.nih.gov/24968215","pmcid":"https://www.ncbi.nlm.nih.gov/pmc/articles/4951206"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci500264r","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-960X","1549-9596"],"is_oa":false,"is_in_doaj":false,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://europepmc.org/articles/pmc4951206?pdf=render","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073973321","display_name":"Sean Ekins","orcid":"https://orcid.org/0000-0002-5691-5790"},"institutions":[{"id":"https://openalex.org/I4210148032","display_name":"Collaborations Pharmaceuticals (United States)","ror":"https://ror.org/04m718665","country_code":"US","type":"company","lineage":["https://openalex.org/I4210148032"]},{"id":"https://openalex.org/I4210147836","display_name":"Collaborative Drug Discovery (United States)","ror":"https://ror.org/04b4sq284","country_code":"US","type":"company","lineage":["https://openalex.org/I4210147836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sean Ekins","raw_affiliation_string":"Collaborations in Chemistry, 5616 Hilltop\rNeedmore Road, Fuquay-Varina, North Carolina 27526, United States; Collaborative Drug Discovery, 1633\rBayshore Highway, Suite 342, Burlingame, California 94010, United States","raw_affiliation_strings":["Collaborations in Chemistry, 5616 Hilltop\rNeedmore Road, Fuquay-Varina, North Carolina 27526, United States","Collaborative Drug Discovery, 1633\rBayshore Highway, Suite 342, Burlingame, California 94010, United States"]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044700909","display_name":"Joel S. Freundlich","orcid":"https://orcid.org/0000-0002-3411-3455"},"institutions":[{"id":"https://openalex.org/I102322142","display_name":"Rutgers, The State University of New Jersey","ror":"https://ror.org/05vt9qd57","country_code":"US","type":"education","lineage":["https://openalex.org/I102322142"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joel S. Freundlich","raw_affiliation_string":"Department of Medicine, Center for Emerging and Reemerging Pathogens and Department of Pharmacology & Physiology, Rutgers University\u2212New Jersey Medical School, 185 South Orange Avenue, Newark, New Jersey 07103, United States","raw_affiliation_strings":["Department of Medicine, Center for Emerging and Reemerging Pathogens and Department of Pharmacology & Physiology, Rutgers University\u2212New Jersey Medical School, 185 South Orange Avenue, Newark, New Jersey 07103, United States"]},{"author_position":"last","author":{"id":"https://openalex.org/A5066715892","display_name":"Robert C. Reynolds","orcid":null},"institutions":[{"id":"https://openalex.org/I32389192","display_name":"University of Alabama at Birmingham","ror":"https://ror.org/008s83205","country_code":"US","type":"education","lineage":["https://openalex.org/I2800507078","https://openalex.org/I32389192"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Robert C. Reynolds","raw_affiliation_string":"Department#R#of Chemistry, College of Arts and Sciences, University of Alabama at Birmingham, 1530 3rd Avenue South, Birmingham, Alabama 35294-1240, United States","raw_affiliation_strings":["Department#R#of Chemistry, College of Arts and Sciences, University of Alabama at Birmingham, 1530 3rd Avenue South, Birmingham, Alabama 35294-1240, United States"]}],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":37,"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"54","issue":"7","first_page":"2157","last_page":"2165"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Methods in Drug Discovery","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Methods in Drug Discovery","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12255","display_name":"Immunogenicity of Biosimilar Therapeutics in Drug Development","score":0.9939,"subfield":{"id":"https://openalex.org/subfields/2403","display_name":"Immunology"},"field":{"id":"https://openalex.org/fields/24","display_name":"Immunology and Microbiology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10038","display_name":"Tuberculosis","score":0.9924,"subfield":{"id":"https://openalex.org/subfields/2725","display_name":"Infectious Diseases"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"keyword":"bigger data","score":0.4664},{"keyword":"machine learning","score":0.4432},{"keyword":"mycobacterium tuberculosis","score":0.3209},{"keyword":"single-point","score":0.25},{"keyword":"dual-event","score":0.25}],"concepts":[{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.61051786},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.5550834},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5461692},{"id":"https://openalex.org/C2779466056","wikidata":"https://www.wikidata.org/wiki/Q107630651","display_name":"Time point","level":2,"score":0.5419756},{"id":"https://openalex.org/C2777975735","wikidata":"https://www.wikidata.org/wiki/Q130971","display_name":"Mycobacterium tuberculosis","level":3,"score":0.5316613},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.498765},{"id":"https://openalex.org/C58471807","wikidata":"https://www.wikidata.org/wiki/Q327120","display_name":"Receiver operating characteristic","level":2,"score":0.49557602},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46689212},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.4656893},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44038653},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43359053},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.42301804},{"id":"https://openalex.org/C2781069245","wikidata":"https://www.wikidata.org/wiki/Q12204","display_name":"Tuberculosis","level":2,"score":0.4082058},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.20455146},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.10534206},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.104504645},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000995","descriptor_name":"Antitubercular Agents","qualifier_ui":"Q000494","qualifier_name":"pharmacology","is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D004353","descriptor_name":"Drug Evaluation, Preclinical","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D048088","descriptor_name":"Informatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D009169","descriptor_name":"Mycobacterium tuberculosis","qualifier_ui":"Q000187","qualifier_name":"drug effects","is_major_topic":true},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000995","descriptor_name":"Antitubercular Agents","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000995","descriptor_name":"Antitubercular Agents","qualifier_ui":"Q000633","qualifier_name":"toxicity","is_major_topic":false},{"descriptor_ui":"D001499","descriptor_name":"Bayes Theorem","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D002522","descriptor_name":"Chlorocebus aethiops","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004305","descriptor_name":"Dose-Response Relationship, Drug","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004353","descriptor_name":"Drug Evaluation, Preclinical","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D048088","descriptor_name":"Informatics","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009169","descriptor_name":"Mycobacterium tuberculosis","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014709","descriptor_name":"Vero Cells","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":4,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci500264r","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-960X","1549-9596"],"is_oa":false,"is_in_doaj":false,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://europepmc.org/articles/pmc4951206","pdf_url":"https://europepmc.org/articles/pmc4951206?pdf=render","source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":["European Bioinformatics Institute"],"type":"repository"},"license":null,"version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4951206","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/24968215","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://europepmc.org/articles/pmc4951206","pdf_url":"https://europepmc.org/articles/pmc4951206?pdf=render","source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":["European Bioinformatics Institute"],"type":"repository"},"license":null,"version":"acceptedVersion","is_accepted":true,"is_published":false},"sustainable_development_goals":[{"display_name":"Good health and well-being","score":0.72,"id":"https://metadata.un.org/sdg/3"}],"grants":[{"funder":"https://openalex.org/F4320306137","funder_display_name":"Bill and Melinda Gates Foundation","award_id":null}],"referenced_works_count":57,"referenced_works":["https://openalex.org/W1964141703","https://openalex.org/W1967396133","https://openalex.org/W1968135993","https://openalex.org/W1974242110","https://openalex.org/W1981066521","https://openalex.org/W1984325804","https://openalex.org/W1984678368","https://openalex.org/W1986106712","https://openalex.org/W1986602441","https://openalex.org/W1993795323","https://openalex.org/W1996194136","https://openalex.org/W2003537793","https://openalex.org/W2007560618","https://openalex.org/W2019154446","https://openalex.org/W2020973204","https://openalex.org/W2020983758","https://openalex.org/W2031441006","https://openalex.org/W2034080889","https://openalex.org/W2035288789","https://openalex.org/W2035776068","https://openalex.org/W2040135138","https://openalex.org/W2041253429","https://openalex.org/W2041610798","https://openalex.org/W2046613566","https://openalex.org/W2048080607","https://openalex.org/W2049773909","https://openalex.org/W2052902229","https://openalex.org/W2059750112","https://openalex.org/W2060531713","https://openalex.org/W2077249477","https://openalex.org/W2080026691","https://openalex.org/W2081770014","https://openalex.org/W2085684476","https://openalex.org/W2091356402","https://openalex.org/W2104780143","https://openalex.org/W2106374535","https://openalex.org/W2107184926","https://openalex.org/W2113972754","https://openalex.org/W2115544494","https://openalex.org/W2116652199","https://openalex.org/W2119410200","https://openalex.org/W2124462881","https://openalex.org/W2125852843","https://openalex.org/W2136905362","https://openalex.org/W2140716928","https://openalex.org/W2142602210","https://openalex.org/W2142733912","https://openalex.org/W2153783740","https://openalex.org/W2155741020","https://openalex.org/W2158023121","https://openalex.org/W2158658436","https://openalex.org/W2161459134","https://openalex.org/W2163576609","https://openalex.org/W2167773607","https://openalex.org/W2168447130","https://openalex.org/W2171660521","https://openalex.org/W2402340532"],"related_works":["https://openalex.org/W2345432972","https://openalex.org/W2970784617","https://openalex.org/W4385649027","https://openalex.org/W2217963778","https://openalex.org/W2129882004","https://openalex.org/W4303685026","https://openalex.org/W1980276147","https://openalex.org/W3187081201","https://openalex.org/W1995646291","https://openalex.org/W2140519023"],"ngrams_url":"https://api.openalex.org/works/W1990919689/ngrams","abstract_inverted_index":{"Tuberculosis":[0],"is":[1,16],"a":[2,131,147],"major,":[3],"neglected":[4],"disease":[5],"for":[6,90,120,187,239],"which":[7,85],"the":[8,26,70,77,126,141,171,178,182,200],"quest":[9],"to":[10,60,199,223],"find":[11],"new":[12],"treatments":[13],"continues.":[14],"There":[15],"an":[17],"abundance":[18],"of":[19,73,135,150,177,202],"data":[20,49,75,83,89,118,123,133,160,167],"from":[21,39,105,125,140,154],"large":[22,71],"phenotypic":[23],"screens":[24],"in":[25,45],"public":[27],"domain":[28],"against":[29],"Mycobacterium":[30],"tuberculosis":[31],"(Mtb).":[32],"Since":[33],"machine":[34,58],"learning":[35,59],"methods":[36],"can":[37,64],"learn":[38],"past":[40],"data,":[41],"we":[42,63],"were":[43],"interested":[44],"addressing":[46],"whether":[47,62],"more":[48],"builds":[50],"better":[51],"models.":[52],"We":[53,99,129],"now":[54],"describe":[55],"using":[56],"Bayesian":[57],"assess":[61],"improve":[65],"our":[66],"models":[67,103,179,189,206,217],"by":[68],"combining":[69,162],"quantities":[72],"single-point":[74,110,163],"with":[76,164,219,230],"much":[78],"smaller":[79,148,204],"(higher":[80],"quality)":[81],"dual-event":[82,108,112,165,205],"sets,":[84],"use":[86],"both":[87,91],"dose\u2013response":[88,113,166],"whole-cell":[92],"antitubercular":[93],"activity":[94],"and":[95,111,137,211],"Vero":[96],"cell":[97],"cytotoxicity.":[98],"have":[100,237],"evaluated":[101],"12":[102],"ranging":[104],"different":[106],"single-point,":[107],"dose\u2013response,":[109],"as":[114,116,144,146,156,225,227],"well":[115,145],"combined":[117],"sets":[119,124],"three":[121],"distinct":[122],"same":[127,142],"laboratory.":[128],"used":[130],"fourth":[132],"set":[134,149],"active":[136,152],"inactive":[138],"compounds":[139,153,221],"group":[143],"177":[151],"GlaxoSmithKline":[155],"test":[157],"sets.":[158],"Our":[159,235],"suggest":[161],"does":[168],"not":[169],"diminish":[170],"internal":[172],"or":[173],"external":[174,194,212],"predictive":[175,226],"ability":[176],"based":[180,247],"on":[181,248],"receiver":[183],"operator":[184],"curve":[185],"(ROC)":[186],"these":[188],"(internal":[190,207],"ROC":[191,195,208,213],"range":[192,196,209],"0.83\u20130.91,":[193],"0.62\u20130.83)":[197],"compared":[198],"orders":[201],"magnitude":[203],"0.6\u20130.83":[210],"0.54\u20130.83).":[214],"In":[215],"conclusion,":[216],"developed":[218],"1200\u20135000":[220],"appear":[222],"be":[224],"those":[228],"generated":[229],"25":[231],"000\u2013350":[232],"000":[233],"molecules.":[234],"results":[236],"implications":[238],"justifying":[240],"further":[241],"high-throughput":[242],"screening":[243],"versus":[244],"focused":[245],"testing":[246],"model":[249],"predictions.":[250]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1990919689","counts_by_year":[{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":8},{"year":2014,"cited_by_count":1}],"updated_date":"2024-03-26T00:23:14.930987","created_date":"2016-06-24"}