{"id":"https://openalex.org/W1994126845","doi":"https://doi.org/10.1021/ci9903049","title":"Analysis of a Large Structure/Biological Activity Data Set Using Recursive Partitioning","display_name":"Analysis of a Large Structure/Biological Activity Data Set Using Recursive Partitioning","publication_year":1999,"publication_date":"1999-10-30","ids":{"openalex":"https://openalex.org/W1994126845","doi":"https://doi.org/10.1021/ci9903049","mag":"1994126845","pmid":"https://pubmed.ncbi.nlm.nih.gov/10614024"},"language":"en","primary_location":{"id":"doi:10.1021/ci9903049","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci9903049","pdf_url":null,"source":{"id":"https://openalex.org/S171559003","display_name":"Journal of Chemical Information and Computer Sciences","issn_l":"0095-2338","issn":["0095-2338","1520-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Computer Sciences","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032585517","display_name":"Andrew Rusinko","orcid":null},"institutions":[{"id":"https://openalex.org/I1309191912","display_name":"Research Triangle Park Foundation","ror":"https://ror.org/03eqttr49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1309191912"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Andrew Rusinko","raw_affiliation_strings":["Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709"],"affiliations":[{"raw_affiliation_string":"Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709","institution_ids":["https://openalex.org/I1309191912"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035114744","display_name":"Mark W. Farmen","orcid":null},"institutions":[{"id":"https://openalex.org/I1309191912","display_name":"Research Triangle Park Foundation","ror":"https://ror.org/03eqttr49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1309191912"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark W. Farmen","raw_affiliation_strings":["Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709"],"affiliations":[{"raw_affiliation_string":"Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709","institution_ids":["https://openalex.org/I1309191912"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017075939","display_name":"Christophe G Lambert","orcid":"https://orcid.org/0000-0003-1994-2893"},"institutions":[{"id":"https://openalex.org/I1309191912","display_name":"Research Triangle Park Foundation","ror":"https://ror.org/03eqttr49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1309191912"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christophe G. Lambert","raw_affiliation_strings":["Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709"],"affiliations":[{"raw_affiliation_string":"Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709","institution_ids":["https://openalex.org/I1309191912"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104058023","display_name":"Paul L. Brown","orcid":null},"institutions":[{"id":"https://openalex.org/I1309191912","display_name":"Research Triangle Park Foundation","ror":"https://ror.org/03eqttr49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1309191912"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paul L. Brown","raw_affiliation_strings":["Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709"],"affiliations":[{"raw_affiliation_string":"Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709","institution_ids":["https://openalex.org/I1309191912"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101659406","display_name":"S. Stanley Young","orcid":"https://orcid.org/0000-0002-7084-0932"},"institutions":[{"id":"https://openalex.org/I1309191912","display_name":"Research Triangle Park Foundation","ror":"https://ror.org/03eqttr49","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1309191912"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"S. Stanley Young","raw_affiliation_strings":["Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709"],"affiliations":[{"raw_affiliation_string":"Research Information Systems, Glaxo Wellcome Inc., Five Moore Drive, Research Triangle Park, North Carolina 27709","institution_ids":["https://openalex.org/I1309191912"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5032585517"],"corresponding_institution_ids":["https://openalex.org/I1309191912"],"apc_list":null,"apc_paid":null,"fwci":16.1172,"has_fulltext":false,"cited_by_count":185,"citation_normalized_percentile":{"value":0.99585027,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"39","issue":"6","first_page":"1017","last_page":"1026"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.983299970626831,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6804744005203247},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.673879861831665},{"id":"https://openalex.org/keywords/recursive-partitioning","display_name":"Recursive partitioning","score":0.6490135192871094},{"id":"https://openalex.org/keywords/biological-data","display_name":"Biological data","score":0.5367172360420227},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5267015099525452},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4892830550670624},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.423051118850708},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.40577638149261475},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.24835294485092163},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22560352087020874},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.19679424166679382},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.09012168645858765}],"concepts":[{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6804744005203247},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.673879861831665},{"id":"https://openalex.org/C137345334","wikidata":"https://www.wikidata.org/wiki/Q7303350","display_name":"Recursive partitioning","level":2,"score":0.6490135192871094},{"id":"https://openalex.org/C201797286","wikidata":"https://www.wikidata.org/wiki/Q4914986","display_name":"Biological data","level":2,"score":0.5367172360420227},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5267015099525452},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4892830550670624},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.423051118850708},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.40577638149261475},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.24835294485092163},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22560352087020874},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.19679424166679382},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.09012168645858765},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D004345","descriptor_name":"Drug Industry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004345","descriptor_name":"Drug Industry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004345","descriptor_name":"Drug Industry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013329","descriptor_name":"Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013329","descriptor_name":"Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013329","descriptor_name":"Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020650","descriptor_name":"Combinatorial Chemistry Techniques","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020650","descriptor_name":"Combinatorial Chemistry Techniques","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020650","descriptor_name":"Combinatorial Chemistry Techniques","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":3,"locations":[{"id":"doi:10.1021/ci9903049","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci9903049","pdf_url":null,"source":{"id":"https://openalex.org/S171559003","display_name":"Journal of Chemical Information and Computer Sciences","issn_l":"0095-2338","issn":["0095-2338","1520-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Computer Sciences","raw_type":"journal-article"},{"id":"pmid:10614024","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/10614024","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and computer sciences","raw_type":null},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.94.8837","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.94.8837","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.goldenhelix.com/download/pdfs/Rusinko.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.6000000238418579,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W578214175","https://openalex.org/W1542150362","https://openalex.org/W1568011753","https://openalex.org/W1594031697","https://openalex.org/W1963717906","https://openalex.org/W1966704112","https://openalex.org/W1968379359","https://openalex.org/W1972206604","https://openalex.org/W1973055726","https://openalex.org/W1977503005","https://openalex.org/W1981832881","https://openalex.org/W1985459162","https://openalex.org/W1986170186","https://openalex.org/W1989141250","https://openalex.org/W1990351156","https://openalex.org/W1991157450","https://openalex.org/W1991453563","https://openalex.org/W1999968212","https://openalex.org/W2001877566","https://openalex.org/W2005685204","https://openalex.org/W2006015657","https://openalex.org/W2006322600","https://openalex.org/W2006661331","https://openalex.org/W2008764714","https://openalex.org/W2014731568","https://openalex.org/W2015561117","https://openalex.org/W2016979469","https://openalex.org/W2021748110","https://openalex.org/W2022885801","https://openalex.org/W2028206557","https://openalex.org/W2031415145","https://openalex.org/W2037261712","https://openalex.org/W2038268267","https://openalex.org/W2043979050","https://openalex.org/W2046311259","https://openalex.org/W2046482449","https://openalex.org/W2047218048","https://openalex.org/W2051802332","https://openalex.org/W2059280933","https://openalex.org/W2070586654","https://openalex.org/W2092194848","https://openalex.org/W2095534911","https://openalex.org/W2097132534","https://openalex.org/W2126359798","https://openalex.org/W2126843316","https://openalex.org/W2127644822","https://openalex.org/W2146143186","https://openalex.org/W2147043735","https://openalex.org/W2150104128","https://openalex.org/W2151079386","https://openalex.org/W2168133763","https://openalex.org/W2291125829","https://openalex.org/W2330820318","https://openalex.org/W2951116435","https://openalex.org/W2951679156","https://openalex.org/W4233014035"],"related_works":["https://openalex.org/W2523220573","https://openalex.org/W2083125347","https://openalex.org/W2047930883","https://openalex.org/W2063942697","https://openalex.org/W1978565033","https://openalex.org/W2329625923","https://openalex.org/W4200279211","https://openalex.org/W1990621789","https://openalex.org/W2088652195","https://openalex.org/W2594414941"],"abstract_inverted_index":{"Combinatorial":[0],"chemistry":[1],"and":[2,20,110,205],"high-throughput":[3],"screening":[4],"are":[5,27,144,210],"revolutionizing":[6],"the":[7,13,81,84,105,123,164,179,198],"process":[8],"of":[9,18,23,60,76,83,99,115,125,129,131,140,154,160,176,207],"lead":[10],"discovery":[11],"in":[12,54,178,187],"pharmaceutical":[14],"industry.":[15],"Large":[16],"numbers":[17],"structures":[19,57,132],"vast":[21],"quantities":[22],"biological":[24,89],"assay":[25],"data":[26,85,90,97,181],"quickly":[28],"being":[29],"accumulated,":[30],"overwhelming":[31],"traditional":[32],"structure/activity":[33,193],"relationship":[34,194],"(SAR)":[35],"analysis":[36,152,162],"technologies.":[37],"Recursive":[38],"partitioning":[39],"is":[40,66,163],"a":[41,67,201],"method":[42,119],"for":[43,174],"statistically":[44],"determining":[45],"rules":[46,87,109,173],"that":[47,183,197],"classify":[48],"objects":[49],"into":[50,58],"similar":[51,63],"categories":[52],"or,":[53],"this":[55,77,155,161,208],"case,":[56],"groups":[59],"molecules":[61],"with":[62,122,150,168],"potencies.":[64],"SCAM":[65],"computer":[68],"program":[69],"implemented":[70],"to":[71,112,138,148,166],"make":[72],"extremely":[73],"efficient":[74],"use":[75],"methodology.":[78],"Depending":[79],"on":[80],"size":[82],"set,":[86],"explaining":[88],"can":[91,133],"be":[92,134,185],"determined":[93],"interactively.":[94],"An":[95,157],"example":[96],"set":[98,182],"1650":[100],"monoamine":[101],"oxidase":[102],"inhibitors":[103],"exemplifies":[104],"method,":[106],"yielding":[107],"substructural":[108],"leading":[111],"general":[113],"classifications":[114],"these":[116],"inhibitors.":[117],"The":[118],"scales":[120],"linearly":[121],"number":[124],"descriptors,":[126],"so":[127],"hundreds":[128],"thousands":[130,137],"analyzed":[135],"utilizing":[136],"millions":[139],"molecular":[141],"descriptors.":[142],"There":[143],"currently":[145],"no":[146],"methods":[147,195],"deal":[149,167],"statistical":[151],"problems":[153],"size.":[156],"important":[158],"aspect":[159],"ability":[165],"mixtures,":[169],"i.e.,":[170],"identify":[171],"SAR":[172],"classes":[175],"compounds":[177,199],"same":[180],"might":[184],"binding":[186],"different":[188],"ways.":[189],"Most":[190],"current":[191],"quantitative":[192],"require":[196],"follow":[200],"single":[202],"mechanism.":[203],"Advantages":[204],"limitations":[206],"methodology":[209],"presented.":[211]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":8}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
