{"id":"https://openalex.org/W2055246239","doi":"https://doi.org/10.1021/ci2000083","title":"Comparison of Combinatorial Clustering Methods on Pharmacological Data Sets Represented by Machine Learning-Selected Real Molecular Descriptors","display_name":"Comparison of Combinatorial Clustering Methods on Pharmacological Data Sets Represented by Machine Learning-Selected Real Molecular Descriptors","publication_year":2011,"publication_date":"2011-11-18","ids":{"openalex":"https://openalex.org/W2055246239","doi":"https://doi.org/10.1021/ci2000083","mag":"2055246239","pmid":"https://pubmed.ncbi.nlm.nih.gov/22098113"},"language":"en","primary_location":{"id":"doi:10.1021/ci2000083","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci2000083","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010951953","display_name":"Oscar Rivera-Borroto","orcid":null},"institutions":[{"id":"https://openalex.org/I3018837529","display_name":"Universidad Central \"Marta Abreu\" de las Villas (UCLV)","ror":"https://ror.org/01cdy6h50","country_code":"CU","type":"education","lineage":["https://openalex.org/I3018837529"]}],"countries":["CU"],"is_corresponding":true,"raw_author_name":"Oscar Miguel Rivera-Borroto","raw_affiliation_strings":["Laboratorio de Bioinform\u00e1tica, Centro de Estudios de Inform\u00e1tica, Facultad de Matem\u00e1tica, F\u00edsica y Computaci\u00f3n, Universidad Central \u201cMarta Abreu\u201d de Las Villas (UCLV), Santa Clara, 54830 Villa Clara, Cuba","Unit of Computer-Aided Molecular \u201cBiosilico\u201d Discovery and Bioinformatic Research (CAMD-BIR Unit), Faculty of Chemistry-Pharmacy, Central University of Las Villas, Santa Clara, 54830 Villa Clara, Cuba"],"affiliations":[{"raw_affiliation_string":"Laboratorio de Bioinform\u00e1tica, Centro de Estudios de Inform\u00e1tica, Facultad de Matem\u00e1tica, F\u00edsica y Computaci\u00f3n, Universidad Central \u201cMarta Abreu\u201d de Las Villas (UCLV), Santa Clara, 54830 Villa Clara, Cuba","institution_ids":["https://openalex.org/I3018837529"]},{"raw_affiliation_string":"Unit of Computer-Aided Molecular \u201cBiosilico\u201d Discovery and Bioinformatic Research (CAMD-BIR Unit), Faculty of Chemistry-Pharmacy, Central University of Las Villas, Santa Clara, 54830 Villa Clara, Cuba","institution_ids":["https://openalex.org/I3018837529"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015398632","display_name":"Yovani Marrero\u2010Ponce","orcid":"https://orcid.org/0000-0003-2721-1142"},"institutions":[{"id":"https://openalex.org/I3018837529","display_name":"Universidad Central \"Marta Abreu\" de las Villas (UCLV)","ror":"https://ror.org/01cdy6h50","country_code":"CU","type":"education","lineage":["https://openalex.org/I3018837529"]}],"countries":["CU"],"is_corresponding":false,"raw_author_name":"Yovani Marrero-Ponce","raw_affiliation_strings":["Unit of Computer-Aided Molecular \u201cBiosilico\u201d Discovery and Bioinformatic Research (CAMD-BIR Unit), Faculty of Chemistry-Pharmacy, Central University of Las Villas, Santa Clara, 54830 Villa Clara, Cuba"],"affiliations":[{"raw_affiliation_string":"Unit of Computer-Aided Molecular \u201cBiosilico\u201d Discovery and Bioinformatic Research (CAMD-BIR Unit), Faculty of Chemistry-Pharmacy, Central University of Las Villas, Santa Clara, 54830 Villa Clara, Cuba","institution_ids":["https://openalex.org/I3018837529"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017047972","display_name":"Jos\u00e9 M. Garc\u0131\u0301a de la Vega","orcid":"https://orcid.org/0000-0002-1940-422X"},"institutions":[{"id":"https://openalex.org/I63634437","display_name":"Universidad Aut\u00f3noma de Madrid","ror":"https://ror.org/01cby8j38","country_code":"ES","type":"education","lineage":["https://openalex.org/I63634437"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Jos\u00e9 Manuel Garc\u00eda-de la Vega","raw_affiliation_strings":["Departamento de Qu\u00edmica F\u00edsica Aplicada, Facultad de Ciencias, Universidad Aut\u00f3noma de Madrid (UAM), 28049 Madrid, Spain"],"affiliations":[{"raw_affiliation_string":"Departamento de Qu\u00edmica F\u00edsica Aplicada, Facultad de Ciencias, Universidad Aut\u00f3noma de Madrid (UAM), 28049 Madrid, Spain","institution_ids":["https://openalex.org/I63634437"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071914516","display_name":"Ricardo Grau-Abalo","orcid":null},"institutions":[{"id":"https://openalex.org/I3018837529","display_name":"Universidad Central \"Marta Abreu\" de las Villas (UCLV)","ror":"https://ror.org/01cdy6h50","country_code":"CU","type":"education","lineage":["https://openalex.org/I3018837529"]}],"countries":["CU"],"is_corresponding":false,"raw_author_name":"Ricardo del Coraz\u00f3n Grau-\u00c1balo","raw_affiliation_strings":["Laboratorio de Bioinform\u00e1tica, Centro de Estudios de Inform\u00e1tica, Facultad de Matem\u00e1tica, F\u00edsica y Computaci\u00f3n, Universidad Central \u201cMarta Abreu\u201d de Las Villas (UCLV), Santa Clara, 54830 Villa Clara, Cuba"],"affiliations":[{"raw_affiliation_string":"Laboratorio de Bioinform\u00e1tica, Centro de Estudios de Inform\u00e1tica, Facultad de Matem\u00e1tica, F\u00edsica y Computaci\u00f3n, Universidad Central \u201cMarta Abreu\u201d de Las Villas (UCLV), Santa Clara, 54830 Villa Clara, Cuba","institution_ids":["https://openalex.org/I3018837529"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5010951953"],"corresponding_institution_ids":["https://openalex.org/I3018837529"],"apc_list":null,"apc_paid":null,"fwci":3.4522,"has_fulltext":false,"cited_by_count":31,"citation_normalized_percentile":{"value":0.92617707,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"51","issue":"12","first_page":"3036","last_page":"3049"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9851999878883362,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7338346242904663},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5703642964363098},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.53801029920578},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5018210411071777},{"id":"https://openalex.org/keywords/molecular-descriptor","display_name":"Molecular descriptor","score":0.48784661293029785},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4298046827316284},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36505648493766785},{"id":"https://openalex.org/keywords/quantitative-structure\u2013activity-relationship","display_name":"Quantitative structure\u2013activity relationship","score":0.08292484283447266}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7338346242904663},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5703642964363098},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.53801029920578},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5018210411071777},{"id":"https://openalex.org/C164923092","wikidata":"https://www.wikidata.org/wiki/Q3705921","display_name":"Molecular descriptor","level":3,"score":0.48784661293029785},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4298046827316284},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36505648493766785},{"id":"https://openalex.org/C164126121","wikidata":"https://www.wikidata.org/wiki/Q766383","display_name":"Quantitative structure\u2013activity relationship","level":2,"score":0.08292484283447266}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004364","descriptor_name":"Pharmaceutical Preparations","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D008954","descriptor_name":"Models, Biological","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008954","descriptor_name":"Models, Biological","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008954","descriptor_name":"Models, Biological","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010600","descriptor_name":"Pharmacology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010600","descriptor_name":"Pharmacology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010600","descriptor_name":"Pharmacology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D021281","descriptor_name":"Quantitative Structure-Activity Relationship","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/ci2000083","is_oa":false,"landing_page_url":"https://doi.org/10.1021/ci2000083","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:22098113","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/22098113","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":80,"referenced_works":["https://openalex.org/W6602908","https://openalex.org/W577239568","https://openalex.org/W945546923","https://openalex.org/W1565746575","https://openalex.org/W1576808520","https://openalex.org/W1619226191","https://openalex.org/W1942764728","https://openalex.org/W1965351956","https://openalex.org/W1965534201","https://openalex.org/W1966166469","https://openalex.org/W1968680412","https://openalex.org/W1969901779","https://openalex.org/W1978163942","https://openalex.org/W1979335751","https://openalex.org/W1983439863","https://openalex.org/W1989897839","https://openalex.org/W1990451437","https://openalex.org/W1992419399","https://openalex.org/W1992579349","https://openalex.org/W1993492933","https://openalex.org/W1999118725","https://openalex.org/W2000376564","https://openalex.org/W2005685204","https://openalex.org/W2007995029","https://openalex.org/W2010528862","https://openalex.org/W2021083597","https://openalex.org/W2021827987","https://openalex.org/W2030909788","https://openalex.org/W2032245355","https://openalex.org/W2041268285","https://openalex.org/W2041282815","https://openalex.org/W2042007894","https://openalex.org/W2047109555","https://openalex.org/W2049615701","https://openalex.org/W2050451453","https://openalex.org/W2056272907","https://openalex.org/W2056308251","https://openalex.org/W2056580937","https://openalex.org/W2057445960","https://openalex.org/W2066845970","https://openalex.org/W2068937739","https://openalex.org/W2070598941","https://openalex.org/W2076391130","https://openalex.org/W2079225303","https://openalex.org/W2082194907","https://openalex.org/W2090704155","https://openalex.org/W2092027887","https://openalex.org/W2095642553","https://openalex.org/W2097745317","https://openalex.org/W2107432340","https://openalex.org/W2109535575","https://openalex.org/W2114772807","https://openalex.org/W2118587067","https://openalex.org/W2125253492","https://openalex.org/W2133990480","https://openalex.org/W2141807666","https://openalex.org/W2149339479","https://openalex.org/W2153922613","https://openalex.org/W2158024647","https://openalex.org/W2158698691","https://openalex.org/W2163212577","https://openalex.org/W2169284845","https://openalex.org/W2177658341","https://openalex.org/W2197388599","https://openalex.org/W2204197091","https://openalex.org/W2213138713","https://openalex.org/W2317442797","https://openalex.org/W2319660501","https://openalex.org/W2320034101","https://openalex.org/W2515184929","https://openalex.org/W2554073607","https://openalex.org/W2798084948","https://openalex.org/W2951528848","https://openalex.org/W3089502740","https://openalex.org/W3103913776","https://openalex.org/W4206744857","https://openalex.org/W4213151958","https://openalex.org/W4240236152","https://openalex.org/W4247989331","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W4298130764","https://openalex.org/W2804364458","https://openalex.org/W2132641928","https://openalex.org/W4310225030","https://openalex.org/W2090259340","https://openalex.org/W2393816671","https://openalex.org/W2158836806","https://openalex.org/W2083665254","https://openalex.org/W1926736923","https://openalex.org/W2942177010"],"abstract_inverted_index":{"Cluster":[0],"algorithms":[1,237,244,263],"play":[2],"an":[3],"important":[4],"role":[5],"in":[6,18,58,86,124,147,164,251,267,282],"diversity":[7],"related":[8],"tasks":[9],"of":[10,26,45,53,96,120,143,193,200,211,226,231,233,261],"modern":[11],"chemoinformatics,":[12],"with":[13,187,208,213,223],"the":[14,62,67,121,165,188,194,201,224,234,252],"widest":[15],"applications":[16],"being":[17,145],"pharmaceutical":[19],"industry":[20],"drug":[21,170],"discovery":[22],"programs.":[23],"The":[24,149,259],"performance":[25,240],"these":[27,262],"grouping":[28,125],"strategies":[29],"depends":[30],"on":[31,75],"various":[32],"factors":[33],"such":[34],"as":[35,83],"molecular":[36,81,177,217],"representation,":[37],"mathematical":[38],"method,":[39],"algorithmical":[40],"technique,":[41],"and":[42,51,109,111,162,215,245,274],"statistical":[43],"distribution":[44],"data.":[46],"For":[47],"this":[48,87,133],"reason,":[49],"introduction":[50],"comparison":[52,136],"new":[54],"methods":[55,123,139],"are":[56,151,159,185,246],"necessary":[57],"order":[59],"to":[60,256,271],"find":[61],"model":[63],"that":[64,158,197],"best":[65],"fits":[66],"problem":[68],"at":[69],"hand.":[70],"Earlier":[71],"comparative":[72,114,269],"studies":[73,115],"report":[74],"Ward's":[76,257],"algorithm":[77],"using":[78,154],"fingerprints":[79],"for":[80],"description":[82],"generally":[84],"superior":[85,239,250],"field.":[88],"However,":[89],"problems":[90,221],"still":[91],"remain,":[92],"i.e.,":[93],"other":[94],"types":[95],"numerical":[97],"descriptions":[98],"have":[99,129],"been":[100,130],"little":[101],"exploited,":[102],"current":[103],"descriptors":[104,178],"selection":[105],"strategy":[106],"is":[107,140,264],"trial":[108],"error-driven,":[110],"no":[112],"previous":[113],"considering":[116],"a":[117,135,209,268],"broader":[118],"domain":[119],"combinatorial":[122,138],"chemoinformatic":[126],"data":[127,156,171,203],"sets":[128,157,204],"conducted.":[131],"In":[132],"work,":[134],"between":[137],"performed,with":[141],"five":[142,232],"them":[144],"novel":[146],"cheminformatics.":[148],"experiments":[150],"carried":[152],"out":[153,230],"eight":[155,202],"well":[160],"established":[161],"validated":[163],"medical":[166],"chemistry":[167],"literature.":[168],"Each":[169],"set":[172],"was":[173],"represented":[174],"by":[175,180],"real":[176],"selected":[179],"machine":[181,275],"learning":[182,276],"techniques,":[183],"which":[184],"consistent":[186],"neighborhood":[189],"principle.":[190],"Statistical":[191],"analysis":[192],"results":[195],"demonstrates":[196],"pharmacological":[198],"activities":[199],"can":[205],"be":[206],"modeled":[207],"few":[210],"families":[212],"2D":[214],"3D":[216],"descriptors,":[218],"avoiding":[219],"classification":[220],"associated":[222],"presence":[225],"nonrelevant":[227],"features.":[228],"Three":[229],"proposed":[235],"cluster":[236],"show":[238],"over":[241],"most":[242,253],"classical":[243],"similar":[247],"(or":[248],"slightly":[249],"optimistic":[254],"sense)":[255],"algorithm.":[258],"usefulness":[260],"also":[265],"assessed":[266],"experiment":[270],"potent":[272],"QSAR":[273],"classifiers,":[277],"where":[278],"they":[279],"perform":[280],"similarly":[281],"some":[283],"cases.":[284]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":2},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
