{"id":"https://openalex.org/W2125109129","doi":"https://doi.org/10.1021/ci049860f","title":"The Reduced Graph Descriptor in Virtual Screening and Data-Driven Clustering of High-Throughput Screening Data","display_name":"The Reduced Graph Descriptor in Virtual Screening and Data-Driven Clustering of High-Throughput Screening Data","publication_year":2004,"publication_date":"2004-09-04","ids":{"openalex":"https://openalex.org/W2125109129","doi":"https://doi.org/10.1021/ci049860f","mag":"2125109129","pmid":"https://pubmed.ncbi.nlm.nih.gov/15554685"},"language":"en","primary_location":{"id":"doi:10.1021/ci049860f","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci049860f","pdf_url":null,"source":{"id":"https://openalex.org/S171559003","display_name":"Journal of Chemical Information and Computer Sciences","issn_l":"0095-2338","issn":["0095-2338","1520-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Computer Sciences","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046590455","display_name":"Gavin Harper","orcid":null},"institutions":[{"id":"https://openalex.org/I188950975","display_name":"GlaxoSmithKline (United Kingdom)","ror":"https://ror.org/01xsqw823","country_code":"GB","type":"company","lineage":["https://openalex.org/I188950975"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"G. Harper","raw_affiliation_strings":["GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom"],"affiliations":[{"raw_affiliation_string":"GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom","institution_ids":["https://openalex.org/I188950975"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058775651","display_name":"Gianpaolo Bravi","orcid":null},"institutions":[{"id":"https://openalex.org/I188950975","display_name":"GlaxoSmithKline (United Kingdom)","ror":"https://ror.org/01xsqw823","country_code":"GB","type":"company","lineage":["https://openalex.org/I188950975"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"G. S. Bravi","raw_affiliation_strings":["GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom"],"affiliations":[{"raw_affiliation_string":"GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom","institution_ids":["https://openalex.org/I188950975"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079075074","display_name":"Stephen D. Pickett","orcid":"https://orcid.org/0000-0002-0958-9830"},"institutions":[{"id":"https://openalex.org/I188950975","display_name":"GlaxoSmithKline (United Kingdom)","ror":"https://ror.org/01xsqw823","country_code":"GB","type":"company","lineage":["https://openalex.org/I188950975"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"S. D. Pickett","raw_affiliation_strings":["GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom"],"affiliations":[{"raw_affiliation_string":"GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom","institution_ids":["https://openalex.org/I188950975"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075541590","display_name":"Jameed Hussain","orcid":null},"institutions":[{"id":"https://openalex.org/I188950975","display_name":"GlaxoSmithKline (United Kingdom)","ror":"https://ror.org/01xsqw823","country_code":"GB","type":"company","lineage":["https://openalex.org/I188950975"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"J. Hussain","raw_affiliation_strings":["GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom"],"affiliations":[{"raw_affiliation_string":"GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom","institution_ids":["https://openalex.org/I188950975"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045116564","display_name":"Darren V. S. Green","orcid":"https://orcid.org/0000-0001-9063-2754"},"institutions":[{"id":"https://openalex.org/I188950975","display_name":"GlaxoSmithKline (United Kingdom)","ror":"https://ror.org/01xsqw823","country_code":"GB","type":"company","lineage":["https://openalex.org/I188950975"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"D. V. S. Green","raw_affiliation_strings":["GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom"],"affiliations":[{"raw_affiliation_string":"GlaxoSmithKline, Gunnels Wood Road, Stevenage SG1 2NY, United Kingdom","institution_ids":["https://openalex.org/I188950975"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5046590455"],"corresponding_institution_ids":["https://openalex.org/I188950975"],"apc_list":null,"apc_paid":null,"fwci":2.3995,"has_fulltext":false,"cited_by_count":85,"citation_normalized_percentile":{"value":0.88566495,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"44","issue":"6","first_page":"2145","last_page":"2156"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9707000255584717,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9279999732971191,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7148383855819702},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6848684549331665},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.6009247899055481},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5464739203453064},{"id":"https://openalex.org/keywords/high-throughput-screening","display_name":"High-throughput screening","score":0.4643678069114685},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4563252925872803},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.289675772190094},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2050304412841797},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.14874860644340515},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.09060618281364441}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7148383855819702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6848684549331665},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.6009247899055481},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5464739203453064},{"id":"https://openalex.org/C51323132","wikidata":"https://www.wikidata.org/wiki/Q626251","display_name":"High-throughput screening","level":2,"score":0.4643678069114685},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4563252925872803},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.289675772190094},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2050304412841797},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.14874860644340515},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.09060618281364441},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1021/ci049860f","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci049860f","pdf_url":null,"source":{"id":"https://openalex.org/S171559003","display_name":"Journal of Chemical Information and Computer Sciences","issn_l":"0095-2338","issn":["0095-2338","1520-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Computer Sciences","raw_type":"journal-article"},{"id":"pmid:15554685","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/15554685","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and computer sciences","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5299999713897705,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W938539187","https://openalex.org/W1595350250","https://openalex.org/W1967436230","https://openalex.org/W1978811796","https://openalex.org/W1981214699","https://openalex.org/W1987752375","https://openalex.org/W1999054993","https://openalex.org/W2005685204","https://openalex.org/W2020536145","https://openalex.org/W2026909852","https://openalex.org/W2026910177","https://openalex.org/W2060531713","https://openalex.org/W2064798225","https://openalex.org/W2074697485","https://openalex.org/W2081050523","https://openalex.org/W2089108696","https://openalex.org/W2121216262","https://openalex.org/W2203775767"],"related_works":["https://openalex.org/W2136583354","https://openalex.org/W2111238207","https://openalex.org/W2804364458","https://openalex.org/W580487332","https://openalex.org/W2097654801","https://openalex.org/W1519879345","https://openalex.org/W3150498631","https://openalex.org/W2371195977","https://openalex.org/W2768489290","https://openalex.org/W2354872674"],"abstract_inverted_index":{"Virtual":[0],"screening":[1,4,53],"and":[2,40,89,93,128,196],"high-throughput":[3,52],"are":[5],"two":[6],"major":[7],"components":[8],"of":[9,45,51,73,82,102,146,170,187],"lead":[10],"discovery":[11],"within":[12],"the":[13,49,63,80,83,100],"pharmaceutical":[14],"industry.":[15],"In":[16,75],"this":[17,76,174],"paper":[18,77],"we":[19,78,116,179],"describe":[20,41,129,166],"improvements":[21],"to":[22,86,161],"previously":[23],"published":[24],"methods":[25,56],"for":[26,57,98],"similarity":[27,60,101,114],"searching":[28,61],"with":[29,32,137,152],"reduced":[30,46,58,64,84,103,126,171],"graphs,":[31],"a":[33,42,71,95,107,130,167,177,191],"particular":[34,192],"focus":[35],"on":[36,106],"ligand-based":[37],"virtual":[38],"screening,":[39],"novel":[43,168],"use":[44,169],"graphs":[47,65,104,127,141,172],"in":[48,150,173,198],"clustering":[50],"data.":[54,164],"Literature":[55],"graph":[59,85],"encode":[62],"as":[66],"binary":[67],"fingerprints,":[68],"which":[69],"has":[70],"number":[72],"issues.":[74],"extend":[79],"definition":[81],"include":[87],"positively":[88],"negatively":[90],"ionizable":[91],"groups":[92],"introduce":[94],"new":[96],"method":[97,178],"measuring":[99],"based":[105],"weighted":[108],"edit":[109],"distance.":[110],"Moving":[111],"beyond":[112],"simple":[113],"searching,":[115],"show":[117],"how":[118],"more":[119],"flexible":[120],"queries":[121],"can":[122],"be":[123],"built":[124],"using":[125],"database":[131],"system":[132],"that":[133,184],"allows":[134],"iterative":[135],"querying":[136],"multiple":[138],"representations.":[139],"Reduced":[140],"capture":[142],"many":[143],"important":[144],"features":[145],"ligand-receptor":[147],"interactions":[148],"and,":[149],"conjunction":[151],"other":[153],"whole":[154,193],"molecule":[155,194],"descriptors,":[156],"provide":[157],"an":[158],"informative":[159],"way":[160],"review":[162],"HTS":[163],"We":[165],"context,":[175],"introducing":[176],"have":[180],"termed":[181],"data-driven":[182],"clustering,":[183],"identifies":[185],"clusters":[186],"molecules":[188],"represented":[189],"by":[190],"descriptor":[195],"enriched":[197],"active":[199],"compounds.":[200]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":3}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
