{"id":"https://openalex.org/W4410968660","doi":"https://doi.org/10.1021/acs.jcim.5c00539","title":"Hierarchical Extended Linkage Method (HELM)\u2019s Deep Dive into Hybrid Clustering Strategies","display_name":"Hierarchical Extended Linkage Method (HELM)\u2019s Deep Dive into Hybrid Clustering Strategies","publication_year":2025,"publication_date":"2025-06-02","ids":{"openalex":"https://openalex.org/W4410968660","doi":"https://doi.org/10.1021/acs.jcim.5c00539","pmid":"https://pubmed.ncbi.nlm.nih.gov/40452401"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.5c00539","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00539","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046415026","display_name":"Lexin Chen","orcid":"https://orcid.org/0000-0002-9528-942X"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lexin Chen","raw_affiliation_strings":["Department of Chemistry and Quantum Theory Project","University of Florida","Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project","institution_ids":[]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045449780","display_name":"J. Santos","orcid":"https://orcid.org/0000-0001-9030-702X"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jherome Brylle Woody Santos","raw_affiliation_strings":["Department of Chemistry and Quantum Theory Project","University of Florida","Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project","institution_ids":[]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004875412","display_name":"Jokent T. Gaza","orcid":"https://orcid.org/0000-0002-7836-4539"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jokent Gaza","raw_affiliation_strings":["Department of Chemistry and Quantum Theory Project","University of Florida","Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project","institution_ids":[]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063704705","display_name":"Alberto P\u00e9rez","orcid":"https://orcid.org/0000-0002-5054-5338"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alberto Perez","raw_affiliation_strings":["Department of Chemistry and Quantum Theory Project","University of Florida","Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project","institution_ids":[]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039322037","display_name":"Ram\u00f3n Alain Miranda\u2010Quintana","orcid":"https://orcid.org/0000-0003-2121-4449"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ram\u00f3n Alain Miranda-Quintana","raw_affiliation_strings":["Department of Chemistry and Quantum Theory Project","University of Florida","Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project","institution_ids":[]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Chemistry and Quantum Theory Project, University of Florida, Gainesville 32611, Florida, United States","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5039322037"],"corresponding_institution_ids":["https://openalex.org/I33213144"],"apc_list":null,"apc_paid":null,"fwci":4.8438,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.95191182,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"65","issue":"12","first_page":"6209","last_page":"6220"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.74961918592453},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6395868062973022},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.5825260877609253},{"id":"https://openalex.org/keywords/linkage","display_name":"Linkage (software)","score":0.524848461151123},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5103561282157898},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5006630420684814},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.49898791313171387},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.4504554867744446},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4124853312969208},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3634968400001526},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.32420867681503296},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24977341294288635},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17036747932434082},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.09236857295036316}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.74961918592453},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6395868062973022},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.5825260877609253},{"id":"https://openalex.org/C31266012","wikidata":"https://www.wikidata.org/wiki/Q6554340","display_name":"Linkage (software)","level":3,"score":0.524848461151123},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5103561282157898},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5006630420684814},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.49898791313171387},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.4504554867744446},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4124853312969208},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3634968400001526},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32420867681503296},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24977341294288635},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17036747932434082},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.09236857295036316},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004247","descriptor_name":"DNA","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004247","descriptor_name":"DNA","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D056004","descriptor_name":"Molecular Dynamics Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D056004","descriptor_name":"Molecular Dynamics Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.5c00539","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00539","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:40452401","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40452401","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3926417061","display_name":null,"funder_award_id":"R35GM150620","funder_id":"https://openalex.org/F4320337354","funder_display_name":"National Institute of General Medical Sciences"},{"id":"https://openalex.org/G4292987561","display_name":null,"funder_award_id":"CHE-2235785","funder_id":"https://openalex.org/F4320337393","funder_display_name":"Division of Chemistry"}],"funders":[{"id":"https://openalex.org/F4320337354","display_name":"National Institute of General Medical Sciences","ror":"https://ror.org/04q48ey07"},{"id":"https://openalex.org/F4320337393","display_name":"Division of Chemistry","ror":"https://ror.org/01ar8dr59"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1128809682","https://openalex.org/W1980317569","https://openalex.org/W1987971958","https://openalex.org/W1990368529","https://openalex.org/W2016381774","https://openalex.org/W2028130802","https://openalex.org/W2029064186","https://openalex.org/W2040809566","https://openalex.org/W2051224630","https://openalex.org/W2085487226","https://openalex.org/W2122932522","https://openalex.org/W2136729627","https://openalex.org/W2136849653","https://openalex.org/W2156825747","https://openalex.org/W2163915395","https://openalex.org/W2204959575","https://openalex.org/W2277366394","https://openalex.org/W2329540625","https://openalex.org/W2332712348","https://openalex.org/W2404280981","https://openalex.org/W2417065262","https://openalex.org/W2552029149","https://openalex.org/W2619824656","https://openalex.org/W2949223833","https://openalex.org/W2991285488","https://openalex.org/W3021303688","https://openalex.org/W3144750446","https://openalex.org/W3153640839","https://openalex.org/W3156755596","https://openalex.org/W3159156584","https://openalex.org/W3216238908","https://openalex.org/W4205177560","https://openalex.org/W4225120470","https://openalex.org/W4281688690","https://openalex.org/W4289948291","https://openalex.org/W4318898843","https://openalex.org/W4396712309","https://openalex.org/W4399879257","https://openalex.org/W4400466484","https://openalex.org/W4401496991","https://openalex.org/W4403058913","https://openalex.org/W4405056329","https://openalex.org/W4405334031"],"related_works":["https://openalex.org/W2487162673","https://openalex.org/W2793211469","https://openalex.org/W2949152769","https://openalex.org/W4372354731","https://openalex.org/W2942366970","https://openalex.org/W2807634898","https://openalex.org/W1692008701","https://openalex.org/W3122664346","https://openalex.org/W2023397165","https://openalex.org/W2992250188"],"abstract_inverted_index":{"Clustering":[0],"remains":[1],"a":[2,61,111,123,157],"key":[3,147],"tool":[4],"in":[5,39,84,199],"the":[6,14,20,40,50,75,82,91,117,127,135,141,150,161,167,173,185],"analysis":[7,187],"of":[8,16,22,65,77,137,143,152,169,175,188],"molecular":[9],"dynamics":[10],"(MD)":[11],"simulations,":[12],"from":[13,60],"preparation":[15],"kinetic":[17],"models":[18],"to":[19,80,106,109,159],"study":[21],"mechanistic":[23],"pathways":[24],"and":[25,45,70,102,164,180],"structural":[26],"determination.":[27],"It":[28],"is":[29,57,149,196],"no":[30],"surprise":[31],"then":[32],"that":[33,133],"multiple":[34],"algorithms":[35],"are":[36],"currently":[37],"used":[38],"MD":[41],"community,":[42],"with":[43,99,190],"<i>k</i>-means":[44,138,162],"hierarchical":[46,128,144],"approaches":[47],"being":[48,78],"arguably":[49],"two":[51],"most":[52],"popular":[53],"approaches.":[54],"The":[55,146],"former":[56],"very":[58,85],"attractive":[59],"purely":[62],"computational":[63],"point":[64],"view,":[66],"demanding":[67],"minimal":[68],"memory":[69,101],"time":[71,103],"resources,":[72],"but":[73,98],"at":[74],"price":[76],"able":[79],"partition":[81],"data":[83],"restrictive":[86],"ways.":[87],"Hierarchical":[88],"strategies,":[89],"on":[90],"other":[92],"hand,":[93],"can":[94],"generate":[95],"arbitrary":[96],"partitions,":[97],"steep":[100],"requirements":[104],"due":[105],"their":[107],"need":[108],"build":[110,166],"pairwise":[112],"distance":[113],"matrix":[114],"for":[115],"all":[116],"considered":[118],"conformations/frames.":[119],"Here":[120],"we":[121],"propose":[122],"new":[124],"hybrid":[125],"paradigm,":[126],"extended":[129],"linkage":[130],"method":[131],"(HELM),":[132],"retains":[134],"efficiency":[136],"while":[139],"incorporating":[140],"flexibility":[142],"methods.":[145],"ingredient":[148],"use":[151],"<i>n</i>-ary":[153],"difference":[154],"functions":[155],"as":[156],"way":[158],"stabilize":[160],"results":[163],"efficiently":[165],"hierarchy":[168],"subsets.":[170],"We":[171],"showcase":[172],"applicability":[174],"this":[176],"strategy":[177],"over":[178,191],"protein-DNA":[179],"protein":[181],"folding":[182],"studies,":[183],"including":[184],"complete":[186],"simulations":[189],"1.5":[192],"million":[193],"frames.":[194],"HELM":[195],"freely":[197],"available":[198],"our":[200],"MDANCE":[201],"clustering":[202],"package.":[203]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
