{"id":"https://openalex.org/W2170379807","doi":"https://doi.org/10.1186/1687-4153-2012-8","title":"Statistical discovery of site inter-dependencies in sub-molecular hierarchical protein structuring","display_name":"Statistical discovery of site inter-dependencies in sub-molecular hierarchical protein structuring","publication_year":2012,"publication_date":"2012-07-13","ids":{"openalex":"https://openalex.org/W2170379807","doi":"https://doi.org/10.1186/1687-4153-2012-8","mag":"2170379807","pmid":"https://pubmed.ncbi.nlm.nih.gov/22793672"},"language":"en","primary_location":{"id":"doi:10.1186/1687-4153-2012-8","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1687-4153-2012-8","pdf_url":"https://bsb-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-4153-2012-8","source":{"id":"https://openalex.org/S22696228","display_name":"EURASIP Journal on Bioinformatics and Systems Biology","issn_l":"1687-4145","issn":["1687-4145","1687-4153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Bioinformatics and Systems Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://bsb-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-4153-2012-8","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088523430","display_name":"Kirk K Durston","orcid":null},"institutions":[{"id":"https://openalex.org/I79817857","display_name":"University of Guelph","ror":"https://ror.org/01r7awg59","country_code":"CA","type":"education","lineage":["https://openalex.org/I79817857"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Kirk K Durston","raw_affiliation_strings":["School of Computer Science, University of Guelph, 50 Stone Road East, Guelph, ON, N1G 2W1, Canada. kdurston@uoguelph.ca","School of Computer Science, University of Guelph, 50 Stone Road East, Guelph, ON, N1G 2W1, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, University of Guelph, 50 Stone Road East, Guelph, ON, N1G 2W1, Canada. kdurston@uoguelph.ca","institution_ids":["https://openalex.org/I79817857"]},{"raw_affiliation_string":"School of Computer Science, University of Guelph, 50 Stone Road East, Guelph, ON, N1G 2W1, Canada","institution_ids":["https://openalex.org/I79817857"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102819493","display_name":"David Chiu","orcid":"https://orcid.org/0000-0002-1210-8268"},"institutions":[{"id":"https://openalex.org/I79817857","display_name":"University of Guelph","ror":"https://ror.org/01r7awg59","country_code":"CA","type":"education","lineage":["https://openalex.org/I79817857"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"David KY Chiu","raw_affiliation_strings":["School of Computer Science, University of Guelph, 50 Stone Road East, Guelph, ON, N1G 2W1, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, University of Guelph, 50 Stone Road East, Guelph, ON, N1G 2W1, Canada","institution_ids":["https://openalex.org/I79817857"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051841038","display_name":"Andrew K. C. Wong","orcid":"https://orcid.org/0000-0002-0019-7152"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Andrew KC Wong","raw_affiliation_strings":["Department of System Design Engineering, University of Waterloo, 200 University Ave. W, Waterloo, ON, N2L 3G1, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of System Design Engineering, University of Waterloo, 200 University Ave. W, Waterloo, ON, N2L 3G1, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015733852","display_name":"Gary C.L. Li","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Gary CL Li","raw_affiliation_strings":["Department of System Design Engineering, University of Waterloo, 200 University Ave. W, Waterloo, ON, N2L 3G1, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of System Design Engineering, University of Waterloo, 200 University Ave. W, Waterloo, ON, N2L 3G1, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5088523430"],"corresponding_institution_ids":["https://openalex.org/I79817857"],"apc_list":null,"apc_paid":null,"fwci":0.5374,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.66751139,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"2012","issue":"1","first_page":"8","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11305","display_name":"Amyloidosis: Diagnosis, Treatment, Outcomes","score":0.2500999867916107,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11305","display_name":"Amyloidosis: Diagnosis, Treatment, Outcomes","score":0.2500999867916107,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.15800000727176666,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T14135","display_name":"Cancer and biochemical research","score":0.054499998688697815,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.646178126335144},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.6156508326530457},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.535371720790863},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5234267711639404},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.4873117208480835},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4816693067550659},{"id":"https://openalex.org/keywords/protein-domain","display_name":"Protein domain","score":0.4585210680961609},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4417960047721863},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.4357760548591614},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.3836812376976013},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.24497580528259277},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18900233507156372},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.1803615689277649}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.646178126335144},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.6156508326530457},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.535371720790863},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5234267711639404},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.4873117208480835},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4816693067550659},{"id":"https://openalex.org/C144292202","wikidata":"https://www.wikidata.org/wiki/Q898273","display_name":"Protein domain","level":3,"score":0.4585210680961609},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4417960047721863},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.4357760548591614},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.3836812376976013},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.24497580528259277},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18900233507156372},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.1803615689277649},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1186/1687-4153-2012-8","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1687-4153-2012-8","pdf_url":"https://bsb-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-4153-2012-8","source":{"id":"https://openalex.org/S22696228","display_name":"EURASIP Journal on Bioinformatics and Systems Biology","issn_l":"1687-4145","issn":["1687-4145","1687-4153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Bioinformatics and Systems Biology","raw_type":"journal-article"},{"id":"pmid:22793672","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/22793672","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP journal on bioinformatics & systems biology","raw_type":null},{"id":"pmh:oai:europepmc.org:2541581","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3524763","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1687-4153-2012-8","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1687-4153-2012-8","pdf_url":"https://bsb-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-4153-2012-8","source":{"id":"https://openalex.org/S22696228","display_name":"EURASIP Journal on Bioinformatics and Systems Biology","issn_l":"1687-4145","issn":["1687-4145","1687-4153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Bioinformatics and Systems Biology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320310304","display_name":"Advanced Foods and Materials Network","ror":"https://ror.org/0149a7069"},{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2170379807.pdf","grobid_xml":"https://content.openalex.org/works/W2170379807.grobid-xml"},"referenced_works_count":56,"referenced_works":["https://openalex.org/W90286923","https://openalex.org/W1491063910","https://openalex.org/W1502030261","https://openalex.org/W1503339369","https://openalex.org/W1504062128","https://openalex.org/W1538614106","https://openalex.org/W1542313442","https://openalex.org/W1900102636","https://openalex.org/W1947957290","https://openalex.org/W1965533615","https://openalex.org/W1969700934","https://openalex.org/W1982996449","https://openalex.org/W1986461448","https://openalex.org/W1987063515","https://openalex.org/W2004105868","https://openalex.org/W2009821000","https://openalex.org/W2013785414","https://openalex.org/W2019503106","https://openalex.org/W2042211659","https://openalex.org/W2043290117","https://openalex.org/W2044460749","https://openalex.org/W2045507971","https://openalex.org/W2048412098","https://openalex.org/W2050043175","https://openalex.org/W2062666353","https://openalex.org/W2071905696","https://openalex.org/W2072325671","https://openalex.org/W2072927313","https://openalex.org/W2094534479","https://openalex.org/W2095313649","https://openalex.org/W2099598754","https://openalex.org/W2100271852","https://openalex.org/W2106014491","https://openalex.org/W2111527303","https://openalex.org/W2114383673","https://openalex.org/W2121053863","https://openalex.org/W2121082582","https://openalex.org/W2121520117","https://openalex.org/W2121615969","https://openalex.org/W2128933128","https://openalex.org/W2132520255","https://openalex.org/W2137991504","https://openalex.org/W2141885858","https://openalex.org/W2154500141","https://openalex.org/W2156012420","https://openalex.org/W2158012006","https://openalex.org/W2321516322","https://openalex.org/W2342048953","https://openalex.org/W2407359617","https://openalex.org/W2788557154","https://openalex.org/W2907227701","https://openalex.org/W3022020637","https://openalex.org/W4210323379","https://openalex.org/W4242150647","https://openalex.org/W4251551014","https://openalex.org/W4253407057"],"related_works":["https://openalex.org/W3200375535","https://openalex.org/W2118652015","https://openalex.org/W1999731297","https://openalex.org/W2130123090","https://openalex.org/W2126196981","https://openalex.org/W2121125726","https://openalex.org/W2038360534","https://openalex.org/W2157362913","https://openalex.org/W1972763041","https://openalex.org/W2121031136"],"abstract_inverted_index":{"BACKGROUND:":[0],"Much":[1],"progress":[2],"has":[3],"been":[4],"made":[5],"in":[6,126,271],"understanding":[7],"the":[8,38,54,66,69,92,97,109,121,136,148,165,192,228,243,272,282,312,319],"3D":[9,23,56,93,149,320],"structure":[10,39,58,150,231,274,321],"of":[11,41,59,68,74,81,99,133,151,210,232,252,263,304,322],"proteins":[12,306],"using":[13,287],"methods":[14],"such":[15],"as":[16,201],"NMR":[17],"and":[18,35,123,184,194,234],"X-ray":[19],"crystallography.":[20],"The":[21,157,175],"resulting":[22],"structures":[24],"are":[25,40,46,84],"extremely":[26],"informative,":[27],"but":[28],"do":[29],"not":[30],"always":[31],"reveal":[32,96],"which":[33,222,264],"sites":[34,83,134,255,298],"residues":[36],"within":[37,53,91,108,135,147,227,239,318],"special":[42],"importance.":[43],"Recently,":[44],"there":[45],"indications":[47],"that":[48,281],"multiple-residue,":[49],"sub-domain":[50,106,238],"structural":[51,225,316],"relationships":[52,90,317],"larger":[55],"consensus":[57],"a":[60,75,113,170,202,235,288,301,323],"protein":[61,76,154,196,260,324],"can":[62,307],"be":[63],"inferred":[64],"from":[65,300],"analysis":[67],"multiple":[70,137,198],"sequence":[71,138,199,302],"alignment":[72,303],"data":[73],"family.":[77,325],"These":[78,213],"intra-dependent":[79],"clusters":[80,176,214,251],"associated":[82,241],"used":[85],"to":[86,120,128,179,191,266],"indicate":[87],"hierarchical":[88,314],"inter-residue":[89,315],"structure.":[94],"To":[95],"patterns":[98],"associations":[100,130,145,209],"among":[101,131,245,297],"individual":[102],"amino":[103],"acids":[104],"or":[105,182],"components":[107,181],"structure,":[110],"we":[111,162,205,284],"apply":[112],"k-modes":[114,158,289],"attribute":[115],"(aligned":[116],"site)":[117],"clustering":[118,160,291],"algorithm":[119,161,292],"ubiquitin":[122,193,233],"transthyretin":[124,195,240,246],"families":[125],"order":[127],"discover":[129],"groups":[132],"alignment.":[139],"We":[140],"then":[141,216],"observe":[142],"what":[143],"these":[144,152],"imply":[146],"two":[153],"families.":[155],"RESULTS:":[156],"site":[159,290],"developed":[163],"maximizes":[164],"intra-group":[166],"interdependencies":[167],"based":[168,293],"on":[169,294],"normalized":[171],"mutual":[172],"information":[173],"measure.":[174],"formed":[177],"correspond":[178],"sub-structural":[180],"binding":[183],"interface":[185,244],"locations.":[186],"Applying":[187],"this":[188],"data-directed":[189],"method":[190,283],"family":[197],"alignments":[200],"test":[203],"bed,":[204],"located":[206],"numerous":[207],"interesting":[208],"interdependent":[211,254],"sites.":[212],"were":[215,256],"arranged":[217],"into":[218,311],"cluster":[219],"tree":[220],"diagrams":[221],"revealed":[223],"four":[224],"sub-domains":[226],"single":[229,236],"domain":[230],"large":[237],"with":[242],"monomers.":[247],"In":[248],"addition,":[249],"several":[250],"mutually":[253],"discovered":[257],"for":[258],"each":[259,262],"family,":[261],"appear":[265],"play":[267],"an":[268],"important":[269],"role":[270],"molecular":[273],"and/or":[275],"function.":[276],"CONCLUSIONS:":[277],"Our":[278],"results":[279],"demonstrate":[280],"present":[285],"here":[286],"interdependency":[295],"evaluation":[296],"obtained":[299],"homologous":[305],"provide":[308],"significant":[309],"insights":[310],"complex,":[313]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
