{"id":"https://openalex.org/W2605412425","doi":"https://doi.org/10.1186/s13015-017-0102-3","title":"Core column prediction for protein multiple sequence alignments","display_name":"Core column prediction for protein multiple sequence alignments","publication_year":2017,"publication_date":"2017-04-19","ids":{"openalex":"https://openalex.org/W2605412425","doi":"https://doi.org/10.1186/s13015-017-0102-3","mag":"2605412425","pmid":"https://pubmed.ncbi.nlm.nih.gov/28435440"},"language":"en","primary_location":{"id":"doi:10.1186/s13015-017-0102-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13015-017-0102-3","pdf_url":"https://almob.biomedcentral.com/track/pdf/10.1186/s13015-017-0102-3","source":{"id":"https://openalex.org/S205663195","display_name":"Algorithms for Molecular Biology","issn_l":"1748-7188","issn":["1748-7188"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for Molecular Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://almob.biomedcentral.com/track/pdf/10.1186/s13015-017-0102-3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014004628","display_name":"Dan DeBlasio","orcid":"https://orcid.org/0000-0003-4110-4431"},"institutions":[{"id":"https://openalex.org/I138006243","display_name":"University of Arizona","ror":"https://ror.org/03m2x1q45","country_code":"US","type":"education","lineage":["https://openalex.org/I138006243"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dan DeBlasio","raw_affiliation_strings":["Computational Biology Department, Carnegie Mellon University, Pittsburgh, PA 15213 USA","Department of Computer Science, The University of Arizona, Tucson, AZ 85721 USA","Department of Computer Science, The University of Arizona, Tucson, AZ, 85721, USA"],"affiliations":[{"raw_affiliation_string":"Computational Biology Department, Carnegie Mellon University, Pittsburgh, PA 15213 USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Department of Computer Science, The University of Arizona, Tucson, AZ 85721 USA","institution_ids":["https://openalex.org/I138006243"]},{"raw_affiliation_string":"Department of Computer Science, The University of Arizona, Tucson, AZ, 85721, USA","institution_ids":["https://openalex.org/I138006243"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083998316","display_name":"John Kececioglu","orcid":"https://orcid.org/0000-0003-1204-6535"},"institutions":[{"id":"https://openalex.org/I138006243","display_name":"University of Arizona","ror":"https://ror.org/03m2x1q45","country_code":"US","type":"education","lineage":["https://openalex.org/I138006243"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"John Kececioglu","raw_affiliation_strings":["Department of Computer Science, The University of Arizona, Tucson, AZ 85721 USA","Department of Computer Science, The University of Arizona, Tucson, AZ, 85721, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, The University of Arizona, Tucson, AZ 85721 USA","institution_ids":["https://openalex.org/I138006243"]},{"raw_affiliation_string":"Department of Computer Science, The University of Arizona, Tucson, AZ, 85721, USA","institution_ids":["https://openalex.org/I138006243"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5014004628"],"corresponding_institution_ids":["https://openalex.org/I138006243","https://openalex.org/I74973139"],"apc_list":{"value":1490,"currency":"GBP","value_usd":1827},"apc_paid":{"value":1490,"currency":"GBP","value_usd":1827},"fwci":0.1123,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49471017,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"12","issue":"1","first_page":"11","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10602","display_name":"Glycosylation and Glycoproteins Research","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/column","display_name":"Column (typography)","score":0.6646232008934021},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6614128351211548},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.6261221170425415},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5361933708190918},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4986405372619629},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.3296426832675934},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.1329006850719452},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.06875842809677124},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.06817123293876648}],"concepts":[{"id":"https://openalex.org/C2780551164","wikidata":"https://www.wikidata.org/wiki/Q2306599","display_name":"Column (typography)","level":3,"score":0.6646232008934021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6614128351211548},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.6261221170425415},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5361933708190918},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4986405372619629},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3296426832675934},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.1329006850719452},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.06875842809677124},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.06817123293876648},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1186/s13015-017-0102-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13015-017-0102-3","pdf_url":"https://almob.biomedcentral.com/track/pdf/10.1186/s13015-017-0102-3","source":{"id":"https://openalex.org/S205663195","display_name":"Algorithms for Molecular Biology","issn_l":"1748-7188","issn":["1748-7188"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for Molecular Biology","raw_type":"journal-article"},{"id":"pmid:28435440","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/28435440","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for molecular biology : AMB","raw_type":null},{"id":"pmh:oai:repository.arizona.edu:10150/623957","is_oa":true,"landing_page_url":"http://hdl.handle.net/10150/623957","pdf_url":null,"source":{"id":"https://openalex.org/S4306400271","display_name":"UA Campus Repository (The University of Arizona)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I138006243","host_organization_name":"University of Arizona","host_organization_lineage":["https://openalex.org/I138006243"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:doaj.org/article:76f852add7e241a29b363ca308c4368d","is_oa":true,"landing_page_url":"https://doaj.org/article/76f852add7e241a29b363ca308c4368d","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms for Molecular Biology, Vol 12, Iss 1, Pp 1-16 (2017)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:5397798","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/5397798","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms Mol Biol","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13015-017-0102-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13015-017-0102-3","pdf_url":"https://almob.biomedcentral.com/track/pdf/10.1186/s13015-017-0102-3","source":{"id":"https://openalex.org/S205663195","display_name":"Algorithms for Molecular Biology","issn_l":"1748-7188","issn":["1748-7188"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for Molecular Biology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1325684988","display_name":null,"funder_award_id":"CCF-1256087","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2375335175","display_name":null,"funder_award_id":"IIS-1217886","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3068176952","display_name":null,"funder_award_id":"R01HG007104","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"},{"id":"https://openalex.org/G3355402586","display_name":null,"funder_award_id":"GBMF4554","funder_id":"https://openalex.org/F4320306202","funder_display_name":"Gordon and Betty Moore Foundation"},{"id":"https://openalex.org/G3641969089","display_name":null,"funder_award_id":"1256087","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6569375368","display_name":null,"funder_award_id":"HG007104","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"},{"id":"https://openalex.org/G7981293496","display_name":null,"funder_award_id":"IIS-1217886","funder_id":"https://openalex.org/F4320337389","funder_display_name":"Division of Information and Intelligent Systems"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306202","display_name":"Gordon and Betty Moore Foundation","ror":"https://ror.org/006wxqw41"},{"id":"https://openalex.org/F4320310160","display_name":"University of Arizona","ror":"https://ror.org/03m2x1q45"},{"id":"https://openalex.org/F4320310207","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"},{"id":"https://openalex.org/F4320337389","display_name":"Division of Information and Intelligent Systems","ror":"https://ror.org/053a2cp42"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2605412425.pdf","grobid_xml":"https://content.openalex.org/works/W2605412425.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W171034855","https://openalex.org/W1519266993","https://openalex.org/W1963957860","https://openalex.org/W1993414412","https://openalex.org/W2007924998","https://openalex.org/W2009570821","https://openalex.org/W2021883973","https://openalex.org/W2035594133","https://openalex.org/W2074830661","https://openalex.org/W2075451741","https://openalex.org/W2102502076","https://openalex.org/W2106053110","https://openalex.org/W2110919845","https://openalex.org/W2114320077","https://openalex.org/W2114616367","https://openalex.org/W2115888213","https://openalex.org/W2127322768","https://openalex.org/W2127556561","https://openalex.org/W2130625618","https://openalex.org/W2133296809","https://openalex.org/W2140890018","https://openalex.org/W2143210482","https://openalex.org/W2146712012","https://openalex.org/W2149956330","https://openalex.org/W2153187042","https://openalex.org/W2154952425","https://openalex.org/W2493400422","https://openalex.org/W2523931589","https://openalex.org/W2776985701","https://openalex.org/W4245668478","https://openalex.org/W4285719527","https://openalex.org/W4300568064"],"related_works":["https://openalex.org/W2181722423","https://openalex.org/W2347222412","https://openalex.org/W2085601491","https://openalex.org/W2375996887","https://openalex.org/W4322723290","https://openalex.org/W2368976073","https://openalex.org/W2376548177","https://openalex.org/W2808994565","https://openalex.org/W2769449614","https://openalex.org/W1956179383"],"abstract_inverted_index":{"We":[0,81,112],"develop":[1],"for":[2,11,95,115],"the":[3,33,89,126],"first":[4],"time":[5],"a":[6,24,55,59,70,76,102,107,130],"<i>predictor</i>":[7],"of":[8,23,91,106,110],"column":[9],"coreness":[10,40,56,84],"protein":[12],"multiple":[13],"sequence":[14],"alignments.":[15],"This":[16],"allows":[17],"us":[18],"to":[19,38,43,86,100],"predict":[20],"which":[21],"columns":[22],"computed":[25],"alignment":[26,105,134],"are":[27],"core,":[28],"and":[29,62,128],"hence":[30],"better":[31],"estimate":[32],"alignment's":[34],"accuracy.":[35,135],"Our":[36],"approach":[37],"predicting":[39],"is":[41],"similar":[42],"nearest-neighbor":[44,52],"classification":[45],"from":[46,125],"machine":[47],"learning,":[48],"except":[49],"we":[50,63],"transform":[51],"distances":[53],"into":[54],"prediction":[57],"via":[58],"regression":[60],"function,":[61],"learn":[64],"an":[65,96],"appropriate":[66],"distance":[67],"function":[68,99],"through":[69],"new":[71],"optimization":[72],"formulation":[73],"that":[74,114],"solves":[75],"large-scale":[77],"linear":[78],"programming":[79],"problem.":[80],"apply":[82],"our":[83,118],"predictor":[85,119],"<i>parameter":[87],"advising</i>,":[88],"task":[90],"choosing":[92],"parameter":[93],"values":[94],"aligner's":[97],"scoring":[98],"obtain":[101],"more":[103],"accurate":[104],"specific":[108],"set":[109],"sequences.":[111],"show":[113],"this":[116],"task,":[117],"strongly":[120],"outperforms":[121],"other":[122],"column-confidence":[123],"estimators":[124],"literature,":[127],"affords":[129],"substantial":[131],"boost":[132],"in":[133]},"counts_by_year":[{"year":2017,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
