{"id":"https://openalex.org/W2024233062","doi":"https://doi.org/10.1145/2506583.2506697","title":"Revealing Protein Structures by Co-Occurrence Clustering of Aligned Pattern Clusters","display_name":"Revealing Protein Structures by Co-Occurrence Clustering of Aligned Pattern Clusters","publication_year":2013,"publication_date":"2013-09-22","ids":{"openalex":"https://openalex.org/W2024233062","doi":"https://doi.org/10.1145/2506583.2506697","mag":"2024233062"},"language":"en","primary_location":{"id":"doi:10.1145/2506583.2506697","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2506583.2506697","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on Bioinformatics, Computational Biology and Biomedical Informatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067575670","display_name":"Sanderz Fung","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Sanderz Fung","raw_affiliation_strings":["Systems Design Engineering, University of Waterloo, Waterloo, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Systems Design Engineering, University of Waterloo, Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054354683","display_name":"En-Shiun Annie Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"En-Shiun Annie Lee","raw_affiliation_strings":["Systems Design Engineering, University of Waterloo, Waterloo, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Systems Design Engineering, University of Waterloo, Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051841038","display_name":"Andrew K. C. Wong","orcid":"https://orcid.org/0000-0002-0019-7152"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Andrew K.C. Wong","raw_affiliation_strings":["Systems Design Engineering, University of Waterloo, Waterloo, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Systems Design Engineering, University of Waterloo, Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07294085,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"869","last_page":"875"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.6287927627563477},{"id":"https://openalex.org/keywords/protein-family","display_name":"Protein family","score":0.5782337188720703},{"id":"https://openalex.org/keywords/loop-modeling","display_name":"Loop modeling","score":0.546654224395752},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.5309234261512756},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5293259024620056},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.5279107689857483},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.5122184157371521},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.48846927285194397},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.46214020252227783},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.3838666081428528},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.36597853899002075},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.3537747859954834},{"id":"https://openalex.org/keywords/protein-structure-prediction","display_name":"Protein structure prediction","score":0.31749075651168823},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.21104338765144348},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.13149061799049377},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1289406716823578}],"concepts":[{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.6287927627563477},{"id":"https://openalex.org/C171897839","wikidata":"https://www.wikidata.org/wiki/Q417841","display_name":"Protein family","level":3,"score":0.5782337188720703},{"id":"https://openalex.org/C45475804","wikidata":"https://www.wikidata.org/wiki/Q6675846","display_name":"Loop modeling","level":4,"score":0.546654224395752},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.5309234261512756},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5293259024620056},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.5279107689857483},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.5122184157371521},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.48846927285194397},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.46214020252227783},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.3838666081428528},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.36597853899002075},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.3537747859954834},{"id":"https://openalex.org/C18051474","wikidata":"https://www.wikidata.org/wiki/Q899656","display_name":"Protein structure prediction","level":3,"score":0.31749075651168823},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.21104338765144348},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.13149061799049377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1289406716823578},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2506583.2506697","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2506583.2506697","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on Bioinformatics, Computational Biology and Biomedical Informatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1938740620","https://openalex.org/W1990368529","https://openalex.org/W2016661940","https://openalex.org/W2051224630","https://openalex.org/W2051664277","https://openalex.org/W2053238682","https://openalex.org/W2130479394","https://openalex.org/W2132629607","https://openalex.org/W2134089414","https://openalex.org/W2163105490","https://openalex.org/W6631828510"],"related_works":["https://openalex.org/W2013950502","https://openalex.org/W3204091482","https://openalex.org/W3171039768","https://openalex.org/W1644669973","https://openalex.org/W2181585194","https://openalex.org/W1543174845","https://openalex.org/W2253761889","https://openalex.org/W2802527233","https://openalex.org/W646353556","https://openalex.org/W3215498386"],"abstract_inverted_index":{"Proteins":[0],"can":[1,42],"be":[2],"represented":[3,15,103],"in":[4,82,97,129,214,225,235],"several":[5],"ways,":[6],"including":[7],"primary":[8],"protein":[9,13,39,45,52,62,71,77,98,174,211,244],"sequence,":[10],"where":[11,25],"the":[12,26,37,59,118,130,142,162,165,194,198,217,236,246,253,262],"is":[14,28,67,135,159],"as":[16,104],"a":[17,31,250,257],"string":[18],"of":[19,61,70,76,156,164,243],"amino":[20],"acids,":[21],"and":[22,91,102,178,200,220,261,275],"three-dimensional":[23,63,84,186,226],"structure,":[24],"sequence":[27,78,88,95],"folded":[29],"into":[30,151],"structure.":[32],"By":[33],"analyzing":[34],"proteins":[35,283],"from":[36,240,285],"same":[38,119],"family,":[40,53],"we":[41],"find":[43,80],"conserved":[44],"regions":[46],"that":[47,51,123,232],"are":[48,100,145,182,233,277],"common":[49,234],"within":[50],"gaining":[54],"biological":[55],"knowledge.":[56],"Compared":[57],"to":[58,79,137,148,160,172,188,191],"amount":[60],"structures":[64,85,187],"available,":[65],"there":[66],"an":[68,286],"abundance":[69],"sequences,":[72],"hence,":[73],"making":[74],"analysis":[75],"characteristics":[81,231],"its":[83],"crucial.":[86],"Through":[87],"pattern":[89],"discovery":[90],"alignment,":[92],"statistically":[93],"significant":[94],"patterns":[96],"families":[99,212],"found":[101,229],"Aligned":[105],"Pattern":[106],"Clusters":[107],"(APCs).":[108],"When":[109],"two":[110,173],"or":[111],"more":[112,268],"APCs":[113,150,222,266],"occur":[114],"frequently":[115],"together":[116,125],"on":[117],"protein,":[120],"this":[121,157],"implies":[122],"they":[124],"have":[126],"important":[127,282],"relationship":[128,140],"protein.":[131],"A":[132],"co-occurrence":[133,259],"score":[134],"used":[136,147],"quantify":[138],"such":[139],"between":[141],"APCs,":[143],"which":[144],"further":[146],"cluster":[149,248,255,264],"APC":[152,238,247,254,263],"clusters.":[153],"The":[154,180,207],"purpose":[155],"paper":[158],"examine":[161,192],"validate":[163],"proposed":[166],"method":[167,171,274],"by":[168,281],"applying":[169],"our":[170,273],"families,":[175],"triosephosphate":[176],"isomerase":[177],"G-alpha.":[179],"results":[181,195,208,276],"then":[183],"verified":[184,280],"using":[185],"check":[189],"both":[190,210,241],"whether":[193],"comply":[196,213],"with":[197,203,216,267],"structure":[199],"how":[201],"often":[202],"different":[204],"known":[205,218],"structures.":[206],"for":[209],"majority":[215],"structures,":[219],"their":[221],"were":[223],"close":[224],"distance.":[227],"We":[228],"three":[230],"resulting":[237],"clusters":[239],"sets":[242],"data:":[245],"forming":[249],"complete":[251],"graph,":[252],"having":[256],"high":[258],"score,":[260],"containing":[265],"than":[269],"one":[270],"patterns.":[271],"Furthermore,":[272],"currently":[278],"being":[279],"crystallized":[284],"immunology":[287],"lab.":[288]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
