{"id":"https://openalex.org/W2115533746","doi":"https://doi.org/10.1145/1562090.1562096","title":"Protein sequence alignment and structural disorder","display_name":"Protein sequence alignment and structural disorder","publication_year":2009,"publication_date":"2009-06-28","ids":{"openalex":"https://openalex.org/W2115533746","doi":"https://doi.org/10.1145/1562090.1562096","mag":"2115533746"},"language":"en","primary_location":{"id":"doi:10.1145/1562090.1562096","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1562090.1562096","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the KDD-09 Workshop on Statistical and Relational Learning in Bioinformatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007397401","display_name":"Uros Midic","orcid":null},"institutions":[{"id":"https://openalex.org/I84392919","display_name":"Temple University","ror":"https://ror.org/00kx1jb78","country_code":"US","type":"education","lineage":["https://openalex.org/I84392919"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Uros Midic","raw_affiliation_strings":["Temple University, Philadelphia, PA",", Temple University, Philadelphia, PA"],"affiliations":[{"raw_affiliation_string":"Temple University, Philadelphia, PA","institution_ids":["https://openalex.org/I84392919"]},{"raw_affiliation_string":", Temple University, Philadelphia, PA","institution_ids":["https://openalex.org/I84392919"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017746551","display_name":"A. Keith Dunker","orcid":"https://orcid.org/0000-0002-0744-5243"},"institutions":[{"id":"https://openalex.org/I55769427","display_name":"Indiana University \u2013 Purdue University Indianapolis","ror":"https://ror.org/05gxnyn08","country_code":"US","type":"education","lineage":["https://openalex.org/I55769427","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. Keith Dunker","raw_affiliation_strings":["Indiana University, Indianapolis, IN"],"affiliations":[{"raw_affiliation_string":"Indiana University, Indianapolis, IN","institution_ids":["https://openalex.org/I55769427"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044038055","display_name":"Zoran Obradovi\u0107","orcid":"https://orcid.org/0000-0002-2051-0142"},"institutions":[{"id":"https://openalex.org/I84392919","display_name":"Temple University","ror":"https://ror.org/00kx1jb78","country_code":"US","type":"education","lineage":["https://openalex.org/I84392919"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zoran Obradovic","raw_affiliation_strings":["Temple University, Philadelphia, PA",", Temple University, Philadelphia, PA"],"affiliations":[{"raw_affiliation_string":"Temple University, Philadelphia, PA","institution_ids":["https://openalex.org/I84392919"]},{"raw_affiliation_string":", Temple University, Philadelphia, PA","institution_ids":["https://openalex.org/I84392919"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5007397401"],"corresponding_institution_ids":["https://openalex.org/I84392919"],"apc_list":null,"apc_paid":null,"fwci":0.2625,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.59447849,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"27","last_page":"31"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11162","display_name":"Enzyme Structure and Function","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/substitution","display_name":"Substitution (logic)","score":0.67512446641922},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.6535686254501343},{"id":"https://openalex.org/keywords/block-matrix","display_name":"Block matrix","score":0.5782209634780884},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.5365512371063232},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.46667468547821045},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.45493823289871216},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.43526825308799744},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.4256003499031067},{"id":"https://openalex.org/keywords/amino-acid","display_name":"Amino acid","score":0.42505955696105957},{"id":"https://openalex.org/keywords/structural-alignment","display_name":"Structural alignment","score":0.4193316698074341},{"id":"https://openalex.org/keywords/alphabet","display_name":"Alphabet","score":0.4111907482147217},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.39369913935661316},{"id":"https://openalex.org/keywords/crystallography","display_name":"Crystallography","score":0.33669817447662354},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33007484674453735},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.30435436964035034},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24584805965423584},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.23669904470443726},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.2014521360397339},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.2001270055770874},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.14547300338745117}],"concepts":[{"id":"https://openalex.org/C2778220771","wikidata":"https://www.wikidata.org/wiki/Q1522579","display_name":"Substitution (logic)","level":2,"score":0.67512446641922},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.6535686254501343},{"id":"https://openalex.org/C85817219","wikidata":"https://www.wikidata.org/wiki/Q884772","display_name":"Block matrix","level":3,"score":0.5782209634780884},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.5365512371063232},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.46667468547821045},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45493823289871216},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.43526825308799744},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.4256003499031067},{"id":"https://openalex.org/C515207424","wikidata":"https://www.wikidata.org/wiki/Q8066","display_name":"Amino acid","level":2,"score":0.42505955696105957},{"id":"https://openalex.org/C4668613","wikidata":"https://www.wikidata.org/wiki/Q4116110","display_name":"Structural alignment","level":5,"score":0.4193316698074341},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.4111907482147217},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.39369913935661316},{"id":"https://openalex.org/C8010536","wikidata":"https://www.wikidata.org/wiki/Q160398","display_name":"Crystallography","level":1,"score":0.33669817447662354},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33007484674453735},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.30435436964035034},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24584805965423584},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.23669904470443726},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.2014521360397339},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.2001270055770874},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.14547300338745117},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1562090.1562096","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1562090.1562096","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the KDD-09 Workshop on Statistical and Relational Learning in Bioinformatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6887030710","display_name":null,"funder_award_id":"R56 LM007688-05A1","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"}],"funders":[{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1531116739","https://openalex.org/W1792685479","https://openalex.org/W1975472870","https://openalex.org/W2049476357","https://openalex.org/W2055043387","https://openalex.org/W2073745520","https://openalex.org/W2074231493","https://openalex.org/W2077797834","https://openalex.org/W2087064593","https://openalex.org/W2095724872","https://openalex.org/W2117237768","https://openalex.org/W2125022522","https://openalex.org/W2143210482","https://openalex.org/W4210968583"],"related_works":["https://openalex.org/W2029514038","https://openalex.org/W2088487249","https://openalex.org/W2111937814","https://openalex.org/W2051969447","https://openalex.org/W1985408726","https://openalex.org/W2061567716","https://openalex.org/W2130940308","https://openalex.org/W2084367350","https://openalex.org/W1981307089","https://openalex.org/W2092691595"],"abstract_inverted_index":{"In":[0,197,233],"protein":[1,262],"sequence":[2,85,142,291],"alignment":[3,10,118,171,260,292],"algorithms,":[4],"a":[5,57,71,211,305],"substitution":[6,29,115,166,213,270,278,286],"matrix":[7,167,182,237,271,287],"of":[8,18,27,97,112,119,134,172,195,227,261,293],"20x20":[9,184,244],"parameters":[11],"is":[12,88,168,272,288,301],"used":[13,207],"to":[14,63,94,146,188,208,224,247,304],"describe":[15,201],"the":[16,32,84,113,130,132,139,176,225,228,231,234,243,268,276,281,284],"rates":[17],"amino":[19,74,151,159],"acid":[20,75],"substitutions":[21],"over":[22],"time.":[23],"Development":[24],"and":[25,102,156,192,250],"evaluation":[26],"most":[28],"matrices":[30,116],"including":[31],"BLOSUM":[33,114,277,306],"family":[34],"[1]":[35],"was":[36],"based":[37],"almost":[38],"entirely":[39],"on":[40,110],"fully":[41,294],"structured":[42,95,101],"proteins.":[43],"Structurally":[44],"disordered":[45,121,154,266],"proteins":[46,48,81,98,122,296],"(i.e.":[47,79],"that":[49,59,186,205,258,264],"lack":[50],"structure,":[51],"either":[52],"in":[53,67,90,153,161,175,230],"part":[54],"or":[55],"as":[56,92,297],"whole)":[58],"have":[60,70],"been":[61],"shown":[62],"be":[64],"very":[65,302],"common":[66],"nature":[68],"[2]":[69],"significantly":[72],"different":[73],"composition":[76],"than":[77,275],"ordered":[78,162,295],"structured)":[80],"[3].":[82],"Furthermore,":[83],"evolution":[86],"rate":[87],"higher":[89],"unstructured":[91,103],"compared":[93],"regions":[96,104,155],"containing":[99],"both":[100],"[4].":[105],"These":[106,254],"results":[107,221],"cast":[108],"doubt":[109],"appropriateness":[111],"for":[117,141,150,158,170,259,290],"structurally":[120],"[5].To":[123],"address":[124],"this":[125,198],"problem,":[126],"we":[127,200,206,238],"take":[128],"into":[129],"account":[131],"concept":[133],"structural":[135],"disorder":[136],"by":[137],"extending":[138],"alphabet":[140],"representation":[143],"from":[144],"20":[145,149,157],"2x20=40":[147],"symbols,":[148],"acids":[152,160],"regions.":[163],"A":[164],"40x40":[165,212,236],"required":[169],"sequences":[173,229,263],"represented":[174],"extended":[177],"alphabet.":[178],"Such":[179],"an":[180,202],"expanded":[181],"contains":[183],"submatrices":[185,245],"correspond":[187],"matching":[189],"ordered-ordered,":[190,248],"ordered-disordered,":[191,249],"disordered-disordered":[193,251],"pairs":[194],"residues.":[196],"paper":[199],"iterative":[203,216],"procedure":[204,217],"estimate":[209],"such":[210],"matrix.":[214,307],"The":[215],"converged":[218],"with":[219,222],"stable":[220],"respect":[223],"choice":[226],"dataset.":[232],"obtained":[235],"found":[239],"substantial":[240],"differences":[241,255],"between":[242],"corresponding":[246],"region":[252],"matching.":[253],"provide":[256],"evidence":[257],"contain":[265],"segments,":[267],"discovered":[269],"more":[273],"appropriate":[274],"matrices.":[279],"At":[280],"same":[282],"time,":[283],"new":[285],"applicable":[289],"its":[298],"order-order":[299],"submatrix":[300],"similar":[303]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
