{"id":"https://openalex.org/W2066810295","doi":"https://doi.org/10.1021/ci050370c","title":"Mining a Chemical Database for Fragment Co-occurrence:\u2009 Discovery of \u201cChemical Clich\u00e9s\u201d","display_name":"Mining a Chemical Database for Fragment Co-occurrence:\u2009 Discovery of \u201cChemical Clich\u00e9s\u201d","publication_year":2006,"publication_date":"2006-01-27","ids":{"openalex":"https://openalex.org/W2066810295","doi":"https://doi.org/10.1021/ci050370c","mag":"2066810295","pmid":"https://pubmed.ncbi.nlm.nih.gov/16562983"},"language":"en","primary_location":{"id":"doi:10.1021/ci050370c","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci050370c","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047891732","display_name":"Eric-Wubbo Lameijer","orcid":"https://orcid.org/0000-0002-0397-0710"},"institutions":[{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Eric-Wubbo Lameijer","raw_affiliation_strings":["Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany"],"affiliations":[{"raw_affiliation_string":"Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany","institution_ids":["https://openalex.org/I121797337"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012010960","display_name":"Joost N. Kok","orcid":"https://orcid.org/0000-0002-7352-1400"},"institutions":[{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Joost N. Kok","raw_affiliation_strings":["Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany"],"affiliations":[{"raw_affiliation_string":"Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany","institution_ids":["https://openalex.org/I121797337"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062646838","display_name":"Thomas B\u00e4ck","orcid":"https://orcid.org/0000-0001-6768-1478"},"institutions":[{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Thomas B\u00e4ck","raw_affiliation_strings":["Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany"],"affiliations":[{"raw_affiliation_string":"Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany","institution_ids":["https://openalex.org/I121797337"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065525958","display_name":"Adriaan P. IJzerman","orcid":"https://orcid.org/0000-0002-1182-2259"},"institutions":[{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Ad P. IJzerman","raw_affiliation_strings":["Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany"],"affiliations":[{"raw_affiliation_string":"Division of Medicinal Chemistry, Leiden/Amsterdam Center for Drug Research, Leiden University, Einsteinweg 55, 2300 RA Leiden, The Netherlands, Leiden Institute of Advanced Computer Science (LIACS), Leiden University, Niels Bohrweg 1, 2333 CA Leiden, The Netherlands, and NuTech Solutions, Martin-Schmeisser-Weg 15, 44227 Dortmund, Germany","institution_ids":["https://openalex.org/I121797337"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047891732"],"corresponding_institution_ids":["https://openalex.org/I121797337"],"apc_list":null,"apc_paid":null,"fwci":4.9054,"has_fulltext":false,"cited_by_count":47,"citation_normalized_percentile":{"value":0.95526548,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"46","issue":"2","first_page":"553","last_page":"562"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10252","display_name":"Microbial Natural Products and Biosynthesis","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/2736","display_name":"Pharmacology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10911","display_name":"Chemical Synthesis and Analysis","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chemical-space","display_name":"Chemical space","score":0.8559510111808777},{"id":"https://openalex.org/keywords/fragment","display_name":"Fragment (logic)","score":0.7763700485229492},{"id":"https://openalex.org/keywords/listing","display_name":"Listing (finance)","score":0.7047716379165649},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.64898681640625},{"id":"https://openalex.org/keywords/chemical-database","display_name":"Chemical database","score":0.6236542463302612},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4749845862388611},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.4554031789302826},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.45375514030456543},{"id":"https://openalex.org/keywords/yield","display_name":"Yield (engineering)","score":0.45320039987564087},{"id":"https://openalex.org/keywords/combinatorial-chemistry","display_name":"Combinatorial chemistry","score":0.3494676947593689},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3384914994239807},{"id":"https://openalex.org/keywords/drug-discovery","display_name":"Drug discovery","score":0.2756626009941101},{"id":"https://openalex.org/keywords/organic-chemistry","display_name":"Organic chemistry","score":0.1520693600177765},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.14804667234420776},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.12466159462928772}],"concepts":[{"id":"https://openalex.org/C99726746","wikidata":"https://www.wikidata.org/wiki/Q906396","display_name":"Chemical space","level":3,"score":0.8559510111808777},{"id":"https://openalex.org/C2776235265","wikidata":"https://www.wikidata.org/wiki/Q18392052","display_name":"Fragment (logic)","level":2,"score":0.7763700485229492},{"id":"https://openalex.org/C2779820595","wikidata":"https://www.wikidata.org/wiki/Q798505","display_name":"Listing (finance)","level":2,"score":0.7047716379165649},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.64898681640625},{"id":"https://openalex.org/C203394866","wikidata":"https://www.wikidata.org/wiki/Q2881060","display_name":"Chemical database","level":2,"score":0.6236542463302612},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4749845862388611},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.4554031789302826},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.45375514030456543},{"id":"https://openalex.org/C134121241","wikidata":"https://www.wikidata.org/wiki/Q899301","display_name":"Yield (engineering)","level":2,"score":0.45320039987564087},{"id":"https://openalex.org/C21951064","wikidata":"https://www.wikidata.org/wiki/Q899212","display_name":"Combinatorial chemistry","level":1,"score":0.3494676947593689},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3384914994239807},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.2756626009941101},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.1520693600177765},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.14804667234420776},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12466159462928772},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000970","descriptor_name":"Antineoplastic Agents","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D000970","descriptor_name":"Antineoplastic Agents","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D000970","descriptor_name":"Antineoplastic Agents","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D003975","descriptor_name":"Diazepam","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D003975","descriptor_name":"Diazepam","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D003975","descriptor_name":"Diazepam","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D013329","descriptor_name":"Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D013329","descriptor_name":"Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D013329","descriptor_name":"Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015195","descriptor_name":"Drug Design","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015394","descriptor_name":"Molecular Structure","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015394","descriptor_name":"Molecular Structure","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015394","descriptor_name":"Molecular Structure","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019992","descriptor_name":"Databases as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019992","descriptor_name":"Databases as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019992","descriptor_name":"Databases as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/ci050370c","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci050370c","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:16562983","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/16562983","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1574994167","https://openalex.org/W1592238003","https://openalex.org/W1966785965","https://openalex.org/W1977340881","https://openalex.org/W1991286793","https://openalex.org/W2003932717","https://openalex.org/W2010624162","https://openalex.org/W2014540789","https://openalex.org/W2029213117","https://openalex.org/W2038702914","https://openalex.org/W2039174451","https://openalex.org/W2060531713","https://openalex.org/W2064885619","https://openalex.org/W2135732933","https://openalex.org/W2146984355","https://openalex.org/W2166478947","https://openalex.org/W2176516200"],"related_works":["https://openalex.org/W2023630889","https://openalex.org/W1980425862","https://openalex.org/W131203294","https://openalex.org/W2043850786","https://openalex.org/W2963031998","https://openalex.org/W4244321733","https://openalex.org/W1997389443","https://openalex.org/W2151971404","https://openalex.org/W2087762413","https://openalex.org/W2167187529"],"abstract_inverted_index":{"Nowadays":[0],"millions":[1],"of":[2,14,24,29,38,52,71,82,94,126,176,181],"different":[3],"compounds":[4,136],"are":[5,96],"known,":[6],"their":[7,129],"structures":[8],"stored":[9],"in":[10,74],"electronic":[11],"databases.":[12],"Analysis":[13],"these":[15],"data":[16,111],"could":[17],"yield":[18],"valuable":[19],"insights":[20],"into":[21,55,115],"the":[22,27,35,39,50,69,80,109,116,141,177],"laws":[23],"chemistry":[25],"and":[26,67,92,128,144,150,171],"habits":[28],"chemists.":[30],"We":[31,48,106],"have":[32],"therefore":[33,145],"explored":[34,119],"public":[36],"database":[37,54],"National":[40],"Cancer":[41],"Institute":[42],"(>250,000":[43],"compounds)":[44],"by":[45,122,137],"pattern":[46],"searching.":[47],"split":[49],"molecules":[51],"this":[53],"fragments":[56,61,91,95,127,165],"to":[57,79],"find":[58],"out":[59,88,174],"which":[60],"exist,":[62],"how":[63],"frequent":[64,98],"they":[65,100],"are,":[66],"whether":[68],"occurrence":[70,81],"one":[72],"fragment":[73,110],"a":[75],"molecule":[76],"is":[77],"related":[78],"another,":[83],"nonoverlapping":[84],"fragment.":[85],"It":[86],"turns":[87],"that":[89,99,108],"some":[90,175],"combinations":[93],"so":[97,120],"can":[101,112,131],"be":[102],"called":[103],"\"chemical":[104],"clich\u00e9s\".":[105],"believe":[107],"give":[113],"insight":[114],"chemical":[117,135,182],"space":[118],"far":[121],"synthesis.":[123],"The":[124],"lists":[125],"(co-)occurrences":[130],"help":[132],"create":[133],"novel":[134],"(i)":[138],"systematically":[139],"listing":[140],"most":[142,146],"popular":[143],"easily":[147,160],"used":[148],"substituents":[149],"ring":[151],"systems":[152],"for":[153,163,167],"synthesizing":[154],"new":[155],"compounds,":[156],"(ii)":[157],"being":[158],"an":[159],"accessible":[161],"repository":[162],"rarer":[164],"suitable":[166],"lead":[168],"compound":[169],"optimization,":[170],"(iii)":[172],"pointing":[173],"yet":[178],"unexplored":[179],"parts":[180],"space.":[183]},"counts_by_year":[{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
