{"id":"https://openalex.org/W1983939461","doi":"https://doi.org/10.1142/s0219720005001648","title":"COVARIATION ANALYSIS OF LOCAL AMINO ACID SEQUENCES IN RECURRENT PROTEIN LOCAL STRUCTURES","display_name":"COVARIATION ANALYSIS OF LOCAL AMINO ACID SEQUENCES IN RECURRENT PROTEIN LOCAL STRUCTURES","publication_year":2005,"publication_date":"2005-12-01","ids":{"openalex":"https://openalex.org/W1983939461","doi":"https://doi.org/10.1142/s0219720005001648","mag":"1983939461","pmid":"https://pubmed.ncbi.nlm.nih.gov/16374913"},"language":"en","primary_location":{"id":"doi:10.1142/s0219720005001648","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219720005001648","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023809838","display_name":"Lu-yong Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]},{"id":"https://openalex.org/I4210137693","display_name":"Siemens (United States)","ror":"https://ror.org/04axb7e79","country_code":"US","type":"company","lineage":["https://openalex.org/I1325886976","https://openalex.org/I4210137693"]},{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"LU-YONG WANG","raw_affiliation_strings":["Integrated Data Systems Department, Siemens Corporate Research and Center for Computational Biology &amp; Bioingormatics, Columbia University, 755, College Road East, Princeton, New Jersey, 08540, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Integrated Data Systems Department, Siemens Corporate Research and Center for Computational Biology &amp; Bioingormatics, Columbia University, 755, College Road East, Princeton, New Jersey, 08540, USA","institution_ids":["https://openalex.org/I20089843","https://openalex.org/I78577930","https://openalex.org/I4210137693"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5023809838"],"corresponding_institution_ids":["https://openalex.org/I20089843","https://openalex.org/I4210137693","https://openalex.org/I78577930"],"apc_list":null,"apc_paid":null,"fwci":0.379,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.58594307,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"03","issue":"06","first_page":"1391","last_page":"1409"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11162","display_name":"Enzyme Structure and Function","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.7800010442733765},{"id":"https://openalex.org/keywords/structural-alignment","display_name":"Structural alignment","score":0.6901717185974121},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.5145061016082764},{"id":"https://openalex.org/keywords/protein-folding","display_name":"Protein folding","score":0.46740180253982544},{"id":"https://openalex.org/keywords/residue","display_name":"Residue (chemistry)","score":0.46447551250457764},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.46153271198272705},{"id":"https://openalex.org/keywords/local-structure","display_name":"Local structure","score":0.46036091446876526},{"id":"https://openalex.org/keywords/protein-tertiary-structure","display_name":"Protein tertiary structure","score":0.4490422308444977},{"id":"https://openalex.org/keywords/multiple-sequence-alignment","display_name":"Multiple sequence alignment","score":0.4395102858543396},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.42377611994743347},{"id":"https://openalex.org/keywords/structural-motif","display_name":"Structural motif","score":0.4236491918563843},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.42359983921051025},{"id":"https://openalex.org/keywords/amino-acid-residue","display_name":"Amino acid residue","score":0.42114561796188354},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3627740740776062},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.32588309049606323},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.23626866936683655},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.22851762175559998},{"id":"https://openalex.org/keywords/crystallography","display_name":"Crystallography","score":0.21596696972846985},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.14026713371276855},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.07564577460289001}],"concepts":[{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.7800010442733765},{"id":"https://openalex.org/C4668613","wikidata":"https://www.wikidata.org/wiki/Q4116110","display_name":"Structural alignment","level":5,"score":0.6901717185974121},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.5145061016082764},{"id":"https://openalex.org/C204328495","wikidata":"https://www.wikidata.org/wiki/Q847556","display_name":"Protein folding","level":2,"score":0.46740180253982544},{"id":"https://openalex.org/C2781338088","wikidata":"https://www.wikidata.org/wiki/Q903495","display_name":"Residue (chemistry)","level":2,"score":0.46447551250457764},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.46153271198272705},{"id":"https://openalex.org/C2986090443","wikidata":"https://www.wikidata.org/wiki/Q77870413","display_name":"Local structure","level":2,"score":0.46036091446876526},{"id":"https://openalex.org/C75599170","wikidata":"https://www.wikidata.org/wiki/Q898483","display_name":"Protein tertiary structure","level":2,"score":0.4490422308444977},{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.4395102858543396},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.42377611994743347},{"id":"https://openalex.org/C132677234","wikidata":"https://www.wikidata.org/wiki/Q3273544","display_name":"Structural motif","level":2,"score":0.4236491918563843},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.42359983921051025},{"id":"https://openalex.org/C2994376932","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Amino acid residue","level":4,"score":0.42114561796188354},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3627740740776062},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.32588309049606323},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.23626866936683655},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.22851762175559998},{"id":"https://openalex.org/C8010536","wikidata":"https://www.wikidata.org/wiki/Q160398","display_name":"Crystallography","level":1,"score":0.21596696972846985},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.14026713371276855},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.07564577460289001},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008956","descriptor_name":"Models, Chemical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000032","qualifier_name":"analysis","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000032","qualifier_name":"analysis","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000032","qualifier_name":"analysis","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D013223","descriptor_name":"Statistics as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013223","descriptor_name":"Statistics as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013223","descriptor_name":"Statistics as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1142/s0219720005001648","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219720005001648","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},{"id":"pmid:16374913","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/16374913","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of bioinformatics and computational biology","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1495099700","https://openalex.org/W1588812136","https://openalex.org/W1985420739","https://openalex.org/W1992366400","https://openalex.org/W2000834633","https://openalex.org/W2005049999","https://openalex.org/W2014095962","https://openalex.org/W2032643862","https://openalex.org/W2033314834","https://openalex.org/W2053721311","https://openalex.org/W2055827177","https://openalex.org/W2074655761","https://openalex.org/W2083098259","https://openalex.org/W2094559779","https://openalex.org/W2105880172","https://openalex.org/W2107100754","https://openalex.org/W2107165577","https://openalex.org/W2118756701","https://openalex.org/W2124649680","https://openalex.org/W2136011546","https://openalex.org/W2137995988","https://openalex.org/W2151687360","https://openalex.org/W2152099594","https://openalex.org/W2166298363","https://openalex.org/W2171641243","https://openalex.org/W2461704835","https://openalex.org/W3047703793","https://openalex.org/W3148560526"],"related_works":["https://openalex.org/W1482324242","https://openalex.org/W2051969447","https://openalex.org/W2187357871","https://openalex.org/W2111937814","https://openalex.org/W2084367350","https://openalex.org/W2029514038","https://openalex.org/W1985408726","https://openalex.org/W2602307348","https://openalex.org/W2220384852","https://openalex.org/W2137427011"],"abstract_inverted_index":{"Local":[0],"structural":[1,42,95,181,210,220],"information":[2,211],"is":[3,121,212],"supposed":[4],"to":[5],"be":[6],"frequently":[7],"encoded":[8,213],"in":[9,27,39,78,93,97,126,133,168,179,196,214,226],"local":[10,20,30,41,62,73,94,135,169,180,191,209,215,219],"amino":[11,129],"acid":[12,130],"sequences.":[13],"Previous":[14],"research":[15],"only":[16],"indicated":[17],"that":[18,85,143,187,207],"some":[19,28,208],"structure":[21],"positions":[22],"have":[23,47],"specific":[24],"residue":[25,87,104,131,141,162],"preferences":[26],"particular":[29,98],"structures.":[31,136],"However,":[32],"correlated":[33,140],"pairwise":[34,128],"replacements":[35],"for":[36],"interacting":[37],"residues":[38],"recurrent":[40,72,134],"motifs":[43,182],"from":[44,75,171,183],"unrelated":[45,76,172,184],"proteins":[46,77,185],"not":[48,145],"been":[49],"studied":[50],"systematically.":[51],"We":[52,137],"introduced":[53],"a":[54,123],"new":[55],"method":[56],"fusing":[57],"statistical":[58,90,165],"covariation":[59],"analysis":[60,66],"and":[61,100,217],"structure-based":[63,68],"alignment.":[64],"Systematic":[65],"of":[67,71,81,176,190],"multiple":[69],"alignments":[70],"structures":[74,170,199],"representative":[79],"subset":[80],"Protein":[82],"Databank":[83],"indicates":[84,186],"covarying":[86,161],"pairs":[88,105,142,163],"with":[89,113,148,164],"significance":[91,166],"exist":[92,167],"motifs,":[96],"beta-turns":[99],"helix":[101],"caps.":[102],"These":[103],"are":[106,144,157,193],"mostly":[107],"linked":[108,147],"through":[109],"polar":[110],"functional":[111],"groups":[112],"direct":[114],"or":[115],"indirect":[116],"hydrogen":[117],"bonding.":[118],"Hydrophobic":[119],"interaction":[120],"also":[122,138],"major":[124],"factor":[125],"constraining":[127],"replacement":[132],"found":[139],"clearly":[146],"through-space":[149],"interactions.":[150],"The":[151,174],"physical":[152],"constrains":[153],"underlying":[154],"these":[155],"covariations":[156,178],"less":[158],"clear.":[159],"Overall,":[160],"proteins.":[173],"existence":[175],"sequence":[177],"many":[188],"relics":[189],"relations":[192],"still":[194],"retained":[195],"the":[197,205,218],"tertiary":[198],"after":[200],"protein":[201,230],"folding.":[202],"It":[203],"supports":[204],"notion":[206],"sequences":[216],"codes":[221],"could":[222],"play":[223],"important":[224],"roles":[225],"determining":[227],"native":[228],"state":[229],"folding":[231],"topology.":[232]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
