{"id":"https://openalex.org/W2017908538","doi":"https://doi.org/10.1021/ci100319n","title":"Identification of Descriptors Capturing Compound Class-Specific Features by Mutual Information Analysis","display_name":"Identification of Descriptors Capturing Compound Class-Specific Features by Mutual Information Analysis","publication_year":2010,"publication_date":"2010-10-20","ids":{"openalex":"https://openalex.org/W2017908538","doi":"https://doi.org/10.1021/ci100319n","mag":"2017908538","pmid":"https://pubmed.ncbi.nlm.nih.gov/20961115"},"language":"en","primary_location":{"id":"doi:10.1021/ci100319n","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci100319n","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023868486","display_name":"Anne Mai Wassermann","orcid":null},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Anne Mai Wassermann","raw_affiliation_strings":["Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089699813","display_name":"Britta Nisius","orcid":null},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Britta Nisius","raw_affiliation_strings":["Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016304883","display_name":"Martin Vogt","orcid":"https://orcid.org/0000-0002-3931-9516"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Martin Vogt","raw_affiliation_strings":["Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039926688","display_name":"J\u00fcrgen Bajorath","orcid":"https://orcid.org/0000-0002-0557-5714"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"J\u00fcrgen Bajorath","raw_affiliation_strings":["Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Life Science Informatics, B-IT, Rheinische Friedrich-Wilhelms-Universit\u00e4t, Dahlmannstrasse 2, D-53113 Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5023868486"],"corresponding_institution_ids":["https://openalex.org/I135140700"],"apc_list":null,"apc_paid":null,"fwci":2.0072,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.85921654,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"50","issue":"11","first_page":"1935","last_page":"1940"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9369000196456909,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9363999962806702,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.6414414644241333},{"id":"https://openalex.org/keywords/cheminformatics","display_name":"Cheminformatics","score":0.6274887323379517},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5806030631065369},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5542020797729492},{"id":"https://openalex.org/keywords/interaction-information","display_name":"Interaction information","score":0.5518758893013},{"id":"https://openalex.org/keywords/information-theory","display_name":"Information theory","score":0.5390026569366455},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49523916840553284},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.47795891761779785},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41927871108055115},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.41641905903816223},{"id":"https://openalex.org/keywords/joint-entropy","display_name":"Joint entropy","score":0.41639912128448486},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.39108115434646606},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3247172236442566},{"id":"https://openalex.org/keywords/principle-of-maximum-entropy","display_name":"Principle of maximum entropy","score":0.2873753011226654},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13366234302520752},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.09644126892089844}],"concepts":[{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.6414414644241333},{"id":"https://openalex.org/C68762167","wikidata":"https://www.wikidata.org/wiki/Q910164","display_name":"Cheminformatics","level":2,"score":0.6274887323379517},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5806030631065369},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5542020797729492},{"id":"https://openalex.org/C38764148","wikidata":"https://www.wikidata.org/wiki/Q17098245","display_name":"Interaction information","level":2,"score":0.5518758893013},{"id":"https://openalex.org/C52622258","wikidata":"https://www.wikidata.org/wiki/Q131222","display_name":"Information theory","level":2,"score":0.5390026569366455},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49523916840553284},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.47795891761779785},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41927871108055115},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.41641905903816223},{"id":"https://openalex.org/C106752470","wikidata":"https://www.wikidata.org/wiki/Q1364826","display_name":"Joint entropy","level":3,"score":0.41639912128448486},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.39108115434646606},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3247172236442566},{"id":"https://openalex.org/C9679016","wikidata":"https://www.wikidata.org/wiki/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.2873753011226654},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13366234302520752},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.09644126892089844},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D002621","descriptor_name":"Chemistry","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D002621","descriptor_name":"Chemistry","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D002621","descriptor_name":"Chemistry","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D048088","descriptor_name":"Informatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D048088","descriptor_name":"Informatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D048088","descriptor_name":"Informatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1021/ci100319n","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci100319n","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:20961115","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/20961115","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7699999809265137,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1545231783","https://openalex.org/W1970651561","https://openalex.org/W1978914444","https://openalex.org/W1995875735","https://openalex.org/W2021775801","https://openalex.org/W2034038739","https://openalex.org/W2060217572","https://openalex.org/W2080734107","https://openalex.org/W2088967604","https://openalex.org/W2099111195","https://openalex.org/W2146950091","https://openalex.org/W2176516200"],"related_works":["https://openalex.org/W2057609120","https://openalex.org/W2903913648","https://openalex.org/W986037092","https://openalex.org/W4225940264","https://openalex.org/W2101924850","https://openalex.org/W4313429060","https://openalex.org/W2996336810","https://openalex.org/W2111510771","https://openalex.org/W2295845123","https://openalex.org/W2075237332"],"abstract_inverted_index":{"The":[0,120],"identification":[1],"of":[2,11,46,72],"molecular":[3],"descriptors":[4,23,83,101],"that":[5,87],"contain":[6],"compound":[7,35,134],"class-specific":[8],"information":[9,30,62,113,118],"is":[10,24,124],"high":[12],"relevance":[13],"in":[14,32,39,65,90],"chemoinformatics.":[15],"A":[16],"generally":[17],"applicable":[18],"way":[19],"to":[20,25,80,97],"identify":[21],"such":[22,100],"determine":[26],"and":[27,38,129],"compare":[28],"their":[29],"content":[31],"a":[33,95],"given":[34],"activity":[36,135],"class":[37],"large":[40],"databases":[41],"where":[42],"the":[43,51,57,104],"vast":[44],"majority":[45],"compounds":[47],"do":[48],"not":[49],"have":[50],"desired":[52],"activity.":[53],"For":[54],"this":[55,73],"purpose,":[56],"Shannon":[58,108],"entropy":[59,109],"concept":[60,74,116],"from":[61,117],"theory":[63],"can":[64],"principle":[66],"be":[67],"employed.":[68],"However,":[69],"previous":[70],"adaptations":[71],"for":[75,84],"descriptor":[76,127],"profiling":[77],"are":[78],"insufficient":[79],"select":[81,99],"discriminatory":[82],"data":[85],"sets":[86],"dramatically":[88],"differ":[89],"size.":[91],"Therefore,":[92],"we":[93],"introduce":[94],"methodology":[96],"reliably":[98],"by":[102,126],"transforming":[103],"previously":[105],"introduced":[106,122],"differential":[107],"formalism":[110],"into":[111],"mutual":[112],"analysis,":[114],"another":[115],"theory.":[119],"newly":[121],"approach":[123],"evaluated":[125],"ranking":[128],"correlation":[130],"analysis":[131],"on":[132],"168":[133],"classes.":[136]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
