{"id":"https://openalex.org/W2092793778","doi":"https://doi.org/10.1186/1471-2105-14-11","title":"An improved method to detect correct protein folds using partial clustering","display_name":"An improved method to detect correct protein folds using partial clustering","publication_year":2013,"publication_date":"2013-01-16","ids":{"openalex":"https://openalex.org/W2092793778","doi":"https://doi.org/10.1186/1471-2105-14-11","mag":"2092793778","pmid":"https://pubmed.ncbi.nlm.nih.gov/23323835"},"language":"en","primary_location":{"id":"doi:10.1186/1471-2105-14-11","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-14-11","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-14-11","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-14-11","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024564391","display_name":"Jianjun Zhou","orcid":"https://orcid.org/0000-0001-9122-2933"},"institutions":[{"id":"https://openalex.org/I4210089559","display_name":"Shenzhen Metro (China)","ror":"https://ror.org/008hpge95","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210089559"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jianjun Zhou","raw_affiliation_strings":["JHK Co., Ltd., 2049 Heping Road, Shenzhen, Guangdong 518010, China","JHK Co., Ltd., Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"JHK Co., Ltd., 2049 Heping Road, Shenzhen, Guangdong 518010, China","institution_ids":[]},{"raw_affiliation_string":"JHK Co., Ltd., Shenzhen, China","institution_ids":["https://openalex.org/I4210089559"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003573061","display_name":"David S. Wishart","orcid":"https://orcid.org/0000-0002-3207-2434"},"institutions":[{"id":"https://openalex.org/I86897205","display_name":"Athabasca University","ror":"https://ror.org/01y3xgc52","country_code":"CA","type":"education","lineage":["https://openalex.org/I86897205"]},{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"David S Wishart","raw_affiliation_strings":["Departments of Computing Science and Biological Sciences, 2-21 Athabasca Hall, University of Alberta, Edmonton, Alberta, T6G 2E8, Canada","Departments of Computing Science and Biological Sciences, 2\u201321 Athabasca Hall, University of Alberta, Edmonton, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of Computing Science and Biological Sciences, 2-21 Athabasca Hall, University of Alberta, Edmonton, Alberta, T6G 2E8, Canada","institution_ids":["https://openalex.org/I86897205","https://openalex.org/I154425047"]},{"raw_affiliation_string":"Departments of Computing Science and Biological Sciences, 2\u201321 Athabasca Hall, University of Alberta, Edmonton, Canada","institution_ids":["https://openalex.org/I154425047"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5024564391"],"corresponding_institution_ids":["https://openalex.org/I4210089559"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":1.9445,"has_fulltext":true,"cited_by_count":23,"citation_normalized_percentile":{"value":0.86091812,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"14","issue":"1","first_page":"11","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.6525999903678894,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.6525999903678894,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.12770000100135803,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.10649999976158142,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoy","display_name":"Decoy","score":0.9447662830352783},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8457422256469727},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6405267119407654},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6232234835624695},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5132200717926025},{"id":"https://openalex.org/keywords/protein-structure-prediction","display_name":"Protein structure prediction","score":0.5080602169036865},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4676347076892853},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.393950492143631},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35590189695358276},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.12920716404914856}],"concepts":[{"id":"https://openalex.org/C2779179475","wikidata":"https://www.wikidata.org/wiki/Q3545649","display_name":"Decoy","level":3,"score":0.9447662830352783},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8457422256469727},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6405267119407654},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6232234835624695},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5132200717926025},{"id":"https://openalex.org/C18051474","wikidata":"https://www.wikidata.org/wiki/Q899656","display_name":"Protein structure prediction","level":3,"score":0.5080602169036865},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4676347076892853},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.393950492143631},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35590189695358276},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.12920716404914856},{"id":"https://openalex.org/C46141821","wikidata":"https://www.wikidata.org/wiki/Q209402","display_name":"Nuclear magnetic resonance","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C170493617","wikidata":"https://www.wikidata.org/wiki/Q208467","display_name":"Receptor","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1186/1471-2105-14-11","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-14-11","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-14-11","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:23323835","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/23323835","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:europepmc.org:2630407","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3626854","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1471-2105-14-11","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-14-11","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-14-11","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320325651","display_name":"Alberta Innovates","ror":null},{"id":"https://openalex.org/F4320337169","display_name":"Alberta Prion Research Institute","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2092793778.pdf","grobid_xml":"https://content.openalex.org/works/W2092793778.grobid-xml"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W242171001","https://openalex.org/W259338706","https://openalex.org/W1971627371","https://openalex.org/W1989777815","https://openalex.org/W2004461664","https://openalex.org/W2013792107","https://openalex.org/W2026469255","https://openalex.org/W2043812656","https://openalex.org/W2052963427","https://openalex.org/W2067516565","https://openalex.org/W2081287834","https://openalex.org/W2090003233","https://openalex.org/W2096635897","https://openalex.org/W2101649702","https://openalex.org/W2110483430","https://openalex.org/W2115817902","https://openalex.org/W2120412255","https://openalex.org/W2124371326","https://openalex.org/W2126630948","https://openalex.org/W2140190241","https://openalex.org/W2146134187","https://openalex.org/W2146413057","https://openalex.org/W2147717514","https://openalex.org/W2161151688","https://openalex.org/W2168282547","https://openalex.org/W2397770138","https://openalex.org/W4241935390"],"related_works":["https://openalex.org/W2038772855","https://openalex.org/W2415073839","https://openalex.org/W3004912075","https://openalex.org/W2173669824","https://openalex.org/W3045029306","https://openalex.org/W2107127921","https://openalex.org/W2913065212","https://openalex.org/W2944571611","https://openalex.org/W2128046947","https://openalex.org/W1972108315"],"abstract_inverted_index":{"BACKGROUND:":[0],"Structure-based":[1],"clustering":[2,25,43,76,110,169,211],"is":[3,162,189],"commonly":[4],"used":[5],"to":[6,103,117,191,232],"identify":[7],"correct":[8,126,149],"protein":[9,19,78],"folds":[10,13],"among":[11],"candidate":[12,62],"(also":[14],"called":[15],"decoys)":[16],"generated":[17],"by":[18,155],"structure":[20,229,244],"prediction":[21,230,245],"programs.":[22],"However,":[23],"traditional":[24],"methods":[26],"exhibit":[27],"a":[28,39,68,104],"poor":[29],"runtime":[30],"performance":[31,59,121,226],"on":[32,77,132],"large":[33],"decoy":[34,102,135,140,186,236],"sets.":[35],"We":[36,66,106],"hypothesized":[37],"that":[38,71,143,179],"more":[40],"efficient":[41],"\"partial\"":[42],"approach":[44],"in":[45,124],"combination":[46],"with":[47,112,234],"an":[48],"improved":[49,221],"scoring":[50,115],"scheme":[51,70],"could":[52],"significantly":[53,163,239],"improve":[54,147,240],"both":[55,119],"the":[56,120,148,206],"speed":[57,123],"and":[58,94,122,137,172,175,188,197,224,238],"of":[60,210],"existing":[61],"selection":[63],"methods.":[64],"RESULTS:":[65],"propose":[67],"new":[69,109,201],"performs":[72],"rapid":[73],"but":[74],"incomplete":[75],"decoys.":[79],"Our":[80],"method":[81,145,181],"detects":[82],"structurally":[83],"similar":[84],"decoys":[85],"(measured":[86],"using":[87],"either":[88],"C(\u03b1)":[89],"RMSD":[90],"or":[91,127],"GDT-TS":[92],"score)":[93],"extracts":[95],"representatives":[96],"from":[97],"them":[98],"without":[99],"assigning":[100],"every":[101,212],"cluster.":[105],"integrated":[107],"our":[108,144,180],"strategy":[111],"several":[113],"different":[114,157],"functions":[116],"assess":[118],"identifying":[125],"near-correct":[128],"folds.":[129],"Experimental":[130],"results":[131],"35":[133],"Rosetta":[134],"sets":[136,141,187,237],"40":[138],"I-TASSER":[139],"show":[142],"can":[146,182],"fold":[150],"detection":[151],"rate":[152],"as":[153],"assessed":[154],"two":[156,166],"quality":[158],"criteria.":[159],"This":[160],"improvement":[161],"better":[164],"than":[165,195],"recently":[167],"published":[168],"methods,":[170],"Durandal":[171,196],"Calibur-lite.":[173,198],"Speed":[174],"efficiency":[176,223],"testing":[177],"shows":[178],"handle":[183],"much":[184],"larger":[185,235],"up":[190],"22":[192],"times":[193],"faster":[194],"CONCLUSIONS:":[199],"The":[200],"method,":[202],"named":[203],"HS-Forest,":[204],"avoids":[205],"computationally":[207],"expensive":[208],"task":[209],"decoy,":[213],"yet":[214],"still":[215],"allows":[216],"superior":[217],"correct-fold":[218],"selection.":[219],"Its":[220],"speed,":[222],"decoy-selection":[225],"should":[227],"enable":[228],"researchers":[231],"work":[233],"their":[241],"ab":[242],"initio":[243],"performance.":[246]},"counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":5}],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2025-10-10T00:00:00"}
