{"id":"https://openalex.org/W2402064298","doi":"https://doi.org/10.1371/journal.pcbi.1004936","title":"Bayesian Top-Down Protein Sequence Alignment with Inferred Position-Specific Gap Penalties","display_name":"Bayesian Top-Down Protein Sequence Alignment with Inferred Position-Specific Gap Penalties","publication_year":2016,"publication_date":"2016-05-18","ids":{"openalex":"https://openalex.org/W2402064298","doi":"https://doi.org/10.1371/journal.pcbi.1004936","mag":"2402064298","pmid":"https://pubmed.ncbi.nlm.nih.gov/27192614"},"language":"en","primary_location":{"id":"doi:10.1371/journal.pcbi.1004936","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1004936","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1004936&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1004936&type=printable","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010571747","display_name":"Andrew F. Neuwald","orcid":"https://orcid.org/0000-0002-0086-5755"},"institutions":[{"id":"https://openalex.org/I126744593","display_name":"University of Maryland, Baltimore","ror":"https://ror.org/04rq5mt64","country_code":"US","type":"education","lineage":["https://openalex.org/I126744593"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Andrew F. Neuwald","raw_affiliation_strings":["Institute for Genome Sciences and Department of Biochemistry & Molecular Biology, University of Maryland School of Medicine, Baltimore, Maryland, United States of America"],"affiliations":[{"raw_affiliation_string":"Institute for Genome Sciences and Department of Biochemistry & Molecular Biology, University of Maryland School of Medicine, Baltimore, Maryland, United States of America","institution_ids":["https://openalex.org/I126744593"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015061000","display_name":"Stephen F. Altschul","orcid":"https://orcid.org/0000-0003-2120-9631"},"institutions":[{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]},{"id":"https://openalex.org/I4210109390","display_name":"National Center for Biotechnology Information","ror":"https://ror.org/02meqm098","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I2800548410","https://openalex.org/I4210109390"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stephen F. Altschul","raw_affiliation_strings":["National Center for Biotechnology Information, National Library of Medicine, National Institutes of Health, Bethesda, Maryland, United States of America"],"affiliations":[{"raw_affiliation_string":"National Center for Biotechnology Information, National Library of Medicine, National Institutes of Health, Bethesda, Maryland, United States of America","institution_ids":["https://openalex.org/I4210109390","https://openalex.org/I1299303238"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5010571747"],"corresponding_institution_ids":["https://openalex.org/I126744593"],"apc_list":{"value":2655,"currency":"USD","value_usd":2655},"apc_paid":{"value":2655,"currency":"USD","value_usd":2655},"fwci":1.7405,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.84707001,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"12","issue":"5","first_page":"e1004936","last_page":"e1004936"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multiple-sequence-alignment","display_name":"Multiple sequence alignment","score":0.7672221660614014},{"id":"https://openalex.org/keywords/markov-chain-monte-carlo","display_name":"Markov chain Monte Carlo","score":0.6209053993225098},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6135230660438538},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.569407045841217},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.5623760223388672},{"id":"https://openalex.org/keywords/alignment-free-sequence-analysis","display_name":"Alignment-free sequence analysis","score":0.5485251545906067},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.546933114528656},{"id":"https://openalex.org/keywords/indel","display_name":"Indel","score":0.4594053328037262},{"id":"https://openalex.org/keywords/structural-alignment","display_name":"Structural alignment","score":0.44709107279777527},{"id":"https://openalex.org/keywords/dirichlet-distribution","display_name":"Dirichlet distribution","score":0.44559550285339355},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.42771345376968384},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.40884366631507874},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3506205081939697},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3145331144332886},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.2621609568595886},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2264626920223236},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.20582666993141174},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.13203269243240356},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.12987565994262695}],"concepts":[{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.7672221660614014},{"id":"https://openalex.org/C111350023","wikidata":"https://www.wikidata.org/wiki/Q1191869","display_name":"Markov chain Monte Carlo","level":3,"score":0.6209053993225098},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6135230660438538},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.569407045841217},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.5623760223388672},{"id":"https://openalex.org/C180384323","wikidata":"https://www.wikidata.org/wiki/Q16335137","display_name":"Alignment-free sequence analysis","level":5,"score":0.5485251545906067},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.546933114528656},{"id":"https://openalex.org/C119054055","wikidata":"https://www.wikidata.org/wiki/Q1576681","display_name":"Indel","level":5,"score":0.4594053328037262},{"id":"https://openalex.org/C4668613","wikidata":"https://www.wikidata.org/wiki/Q4116110","display_name":"Structural alignment","level":5,"score":0.44709107279777527},{"id":"https://openalex.org/C169214877","wikidata":"https://www.wikidata.org/wiki/Q981016","display_name":"Dirichlet distribution","level":3,"score":0.44559550285339355},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.42771345376968384},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.40884366631507874},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3506205081939697},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3145331144332886},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.2621609568595886},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2264626920223236},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.20582666993141174},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.13203269243240356},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.12987565994262695},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C182310444","wikidata":"https://www.wikidata.org/wiki/Q1332643","display_name":"Boundary value problem","level":2,"score":0.0},{"id":"https://openalex.org/C153209595","wikidata":"https://www.wikidata.org/wiki/Q501128","display_name":"Single-nucleotide polymorphism","level":4,"score":0.0},{"id":"https://openalex.org/C135763542","wikidata":"https://www.wikidata.org/wiki/Q106016","display_name":"Genotype","level":3,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001499","descriptor_name":"Bayes Theorem","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001499","descriptor_name":"Bayes Theorem","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001499","descriptor_name":"Bayes Theorem","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001499","descriptor_name":"Bayes Theorem","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009010","descriptor_name":"Monte Carlo Method","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009010","descriptor_name":"Monte Carlo Method","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009010","descriptor_name":"Monte Carlo Method","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009010","descriptor_name":"Monte Carlo Method","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000592","qualifier_name":"standards","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000592","qualifier_name":"standards","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000592","qualifier_name":"standards","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000592","qualifier_name":"standards","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":6,"locations":[{"id":"doi:10.1371/journal.pcbi.1004936","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1004936","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1004936&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},{"id":"pmid:27192614","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/27192614","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS computational biology","raw_type":null},{"id":"pmh:oai:RePEc:plo:pcbi00:1004936","is_oa":false,"landing_page_url":"https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1004936","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},{"id":"pmh:oai:doaj.org/article:72b8929ae7bd4ddea360307582e69265","is_oa":true,"landing_page_url":"https://doaj.org/article/72b8929ae7bd4ddea360307582e69265","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, Vol 12, Iss 5, p e1004936 (2016)","raw_type":"article"},{"id":"pmh:oai:figshare.com:article/3389968","is_oa":true,"landing_page_url":"https://figshare.com/articles/dataset/Bayesian_Top-Down_Protein_Sequence_Alignment_with_Inferred_Position-Specific_Gap_Penalties/3389968","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Dataset"},{"id":"pmh:oai:pubmedcentral.nih.gov:4871425","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/4871425","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Comput Biol","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1371/journal.pcbi.1004936","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1004936","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1004936&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5099999904632568,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2402064298.pdf","grobid_xml":"https://content.openalex.org/works/W2402064298.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W1519266993","https://openalex.org/W1574109141","https://openalex.org/W1590240800","https://openalex.org/W1969153299","https://openalex.org/W1970999032","https://openalex.org/W1980557641","https://openalex.org/W1986014242","https://openalex.org/W2006438342","https://openalex.org/W2024060531","https://openalex.org/W2036295979","https://openalex.org/W2038862069","https://openalex.org/W2045312812","https://openalex.org/W2056251063","https://openalex.org/W2066167693","https://openalex.org/W2067117360","https://openalex.org/W2069739265","https://openalex.org/W2077013196","https://openalex.org/W2101460669","https://openalex.org/W2105428289","https://openalex.org/W2109497857","https://openalex.org/W2115394533","https://openalex.org/W2122665495","https://openalex.org/W2127322768","https://openalex.org/W2127520112","https://openalex.org/W2127774996","https://openalex.org/W2132926880","https://openalex.org/W2134043769","https://openalex.org/W2136570298","https://openalex.org/W2151831732","https://openalex.org/W2153544371","https://openalex.org/W2160378127","https://openalex.org/W2170831688","https://openalex.org/W2189955651","https://openalex.org/W2330406605","https://openalex.org/W2418868888","https://openalex.org/W2431006159","https://openalex.org/W4252684946"],"related_works":["https://openalex.org/W2051969447","https://openalex.org/W2111937814","https://openalex.org/W2029514038","https://openalex.org/W2141411672","https://openalex.org/W2133116680","https://openalex.org/W1482324242","https://openalex.org/W2468116983","https://openalex.org/W2088487249","https://openalex.org/W187239587","https://openalex.org/W2158700816"],"abstract_inverted_index":{"We":[0],"describe":[1],"a":[2,55,59,132,183,248,256,267,272],"Bayesian":[3,133],"Markov":[4],"chain":[5],"Monte":[6],"Carlo":[7],"(MCMC)":[8],"sampler":[9],"for":[10,185,193,203],"protein":[11,217],"multiple":[12],"sequence":[13,97,154],"alignment":[14,99,137,187,252],"(MSA)":[15],"that,":[16],"as":[17,122],"implemented":[18],"in":[19,81,101,106,238],"the":[20,35,72,111,125,141,166,197,239],"program":[21,282],"GISMO":[22,46,152,254,281],"and":[23,42,75,146,245,265],"applied":[24],"to":[25,48,227,250],"large":[26],"numbers":[27],"of":[28,45,113,136,199,241,276],"diverse":[29,274],"sequences,":[30,74],"is":[31,161,213,283],"more":[32,204],"accurate":[33],"than":[34,259],"popular":[36],"MSA":[37,261],"programs":[38],"MUSCLE,":[39],"MAFFT,":[40],"Clustal-\u03a9":[41],"Kalign.":[43],"Features":[44],"central":[47],"its":[49],"performance":[50,212],"are:":[51],"(i)":[52],"It":[53,84,130,181],"employs":[54],"\"top-down\"":[56],"strategy":[57],"with":[58],"favorable":[60],"asymptotic":[61],"time":[62],"complexity":[63],"that":[64,89,189],"first":[65],"identifies":[66],"regions":[67,155],"generally":[68],"shared":[69],"by":[70],"all":[71],"input":[73],"then":[76],"realigns":[77],"closely":[78],"related":[79],"subgroups":[80],"tandem.":[82],"(ii)":[83],"infers":[85],"position-specific":[86],"gap":[87],"penalties":[88],"favor":[90],"insertions":[91,114],"or":[92],"deletions":[93],"(indels)":[94],"within":[95,271],"each":[96],"at":[98,285],"positions":[100],"which":[102,118,175,233],"indels":[103],"are":[104],"invoked":[105],"other":[107,260],"sequences.":[108,179,223,279],"This":[109,160],"favors":[110],"placement":[112],"between":[115],"conserved":[116,268],"blocks,":[117],"can":[119],"be":[120],"understood":[121],"making":[123],"up":[124],"proteins'":[126],"structural":[127],"core.":[128],"(iii)":[129],"uses":[131],"statistical":[134],"measure":[135],"quality":[138],"based":[139,164],"on":[140,147,165,220],"minimum":[142],"description":[143],"length":[144,278],"principle":[145],"Dirichlet":[148],"mixture":[149],"priors.":[150],"Consequently,":[151],"aligns":[153],"only":[156],"when":[157],"statistically":[158],"justified.":[159],"unlike":[162],"methods":[163],"ad":[167],"hoc,":[168],"but":[169],"widely":[170],"used,":[171],"sum-of-the-pairs":[172],"scoring":[173],"system,":[174],"will":[176],"align":[177],"random":[178],"(iv)":[180],"defines":[182],"system":[184],"exploring":[186],"space":[188],"provides":[190],"natural":[191],"avenues":[192],"further":[194],"experimentation":[195],"through":[196],"development":[198],"new":[200],"sampling":[201],"strategies":[202],"efficiently":[205],"escaping":[206],"from":[207],"suboptimal":[208],"traps.":[209],"GISMO's":[210],"superior":[211],"illustrated":[214],"using":[215],"408":[216],"sets":[218,225],"containing,":[219],"average,":[221],"235":[222],"These":[224],"correspond":[226],"NCBI":[228],"Conserved":[229],"Domain":[230],"Database":[231],"alignments,":[232],"have":[234],"been":[235],"manually":[236],"curated":[237],"light":[240],"available":[242,284],"crystal":[243],"structures,":[244],"thus":[246],"provide":[247],"means":[249],"assess":[251],"accuracy.":[253],"fills":[255],"different":[257],"niche":[258],"programs,":[262],"namely":[263],"identifying":[264],"aligning":[266],"domain":[269],"present":[270],"large,":[273],"set":[275],"full":[277],"The":[280],"http://gismo.igs.umaryland.edu/.":[286]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
