{"id":"https://openalex.org/W2060797027","doi":"https://doi.org/10.1371/journal.pcbi.1000605","title":"Annotation Error in Public Databases: Misannotation of Molecular Function in Enzyme Superfamilies","display_name":"Annotation Error in Public Databases: Misannotation of Molecular Function in Enzyme Superfamilies","publication_year":2009,"publication_date":"2009-12-10","ids":{"openalex":"https://openalex.org/W2060797027","doi":"https://doi.org/10.1371/journal.pcbi.1000605","mag":"2060797027","pmid":"https://pubmed.ncbi.nlm.nih.gov/20011109"},"language":"en","primary_location":{"id":"doi:10.1371/journal.pcbi.1000605","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1000605","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1000605&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1000605&type=printable","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017236112","display_name":"Alexandra M. Schnoes","orcid":"https://orcid.org/0000-0003-2727-7758"},"institutions":[{"id":"https://openalex.org/I180670191","display_name":"University of California, San Francisco","ror":"https://ror.org/043mz5j54","country_code":"US","type":"education","lineage":["https://openalex.org/I180670191"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexandra M. Schnoes","raw_affiliation_strings":["Graduate Group in Biophysics, University of California San Francisco, San Francisco, California, United States of America"],"affiliations":[{"raw_affiliation_string":"Graduate Group in Biophysics, University of California San Francisco, San Francisco, California, United States of America","institution_ids":["https://openalex.org/I180670191"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111814314","display_name":"Shoshana Brown","orcid":null},"institutions":[{"id":"https://openalex.org/I180670191","display_name":"University of California, San Francisco","ror":"https://ror.org/043mz5j54","country_code":"US","type":"education","lineage":["https://openalex.org/I180670191"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shoshana D. Brown","raw_affiliation_strings":["Department of Bioengineering and Therapeutic Sciences, University of California San Francisco, San Francisco, California, United States of America"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering and Therapeutic Sciences, University of California San Francisco, San Francisco, California, United States of America","institution_ids":["https://openalex.org/I180670191"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090448729","display_name":"Igor Dodevski","orcid":null},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Igor Dodevski","raw_affiliation_strings":["Department of Biochemistry, University of Z\u00fcrich, Z\u00fcrich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Department of Biochemistry, University of Z\u00fcrich, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I202697423"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020002876","display_name":"Patricia C. Babbitt","orcid":"https://orcid.org/0000-0003-0375-9015"},"institutions":[{"id":"https://openalex.org/I103922791","display_name":"QB3","ror":"https://ror.org/04n1n3n22","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I103922791","https://openalex.org/I180670191","https://openalex.org/I185103710","https://openalex.org/I95457486"]},{"id":"https://openalex.org/I180670191","display_name":"University of California, San Francisco","ror":"https://ror.org/043mz5j54","country_code":"US","type":"education","lineage":["https://openalex.org/I180670191"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Patricia C. Babbitt","raw_affiliation_strings":["California Institute for Quantitative Biosciences, University of California San Francisco, San Francisco, California, United States of America","Department of Bioengineering and Therapeutic Sciences, University of California San Francisco, San Francisco, California, United States of America","Department of Pharmaceutical Chemistry, University of California San Francisco, San Francisco, California, United States of America"],"affiliations":[{"raw_affiliation_string":"California Institute for Quantitative Biosciences, University of California San Francisco, San Francisco, California, United States of America","institution_ids":["https://openalex.org/I103922791","https://openalex.org/I180670191"]},{"raw_affiliation_string":"Department of Bioengineering and Therapeutic Sciences, University of California San Francisco, San Francisco, California, United States of America","institution_ids":["https://openalex.org/I180670191"]},{"raw_affiliation_string":"Department of Pharmaceutical Chemistry, University of California San Francisco, San Francisco, California, United States of America","institution_ids":["https://openalex.org/I180670191"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020002876"],"corresponding_institution_ids":["https://openalex.org/I103922791","https://openalex.org/I180670191"],"apc_list":{"value":2655,"currency":"USD","value_usd":2655},"apc_paid":{"value":2655,"currency":"USD","value_usd":2655},"fwci":14.4233,"has_fulltext":true,"cited_by_count":705,"citation_normalized_percentile":{"value":0.99394445,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"5","issue":"12","first_page":"e1000605","last_page":"e1000605"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/uniprot","display_name":"UniProt","score":0.9649074077606201},{"id":"https://openalex.org/keywords/genbank","display_name":"GenBank","score":0.8309332132339478},{"id":"https://openalex.org/keywords/kegg","display_name":"KEGG","score":0.8193983435630798},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6908634901046753},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5867945551872253},{"id":"https://openalex.org/keywords/sequence-database","display_name":"Sequence database","score":0.5094934105873108},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.4946150481700897},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.48981139063835144},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.48528286814689636},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.473283976316452},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4127046763896942},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.3033648729324341},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.2714710235595703},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.2380758821964264},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.18489250540733337},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.16558033227920532},{"id":"https://openalex.org/keywords/gene-ontology","display_name":"Gene ontology","score":0.08639472723007202}],"concepts":[{"id":"https://openalex.org/C202264299","wikidata":"https://www.wikidata.org/wiki/Q905695","display_name":"UniProt","level":3,"score":0.9649074077606201},{"id":"https://openalex.org/C79029880","wikidata":"https://www.wikidata.org/wiki/Q901755","display_name":"GenBank","level":3,"score":0.8309332132339478},{"id":"https://openalex.org/C152724338","wikidata":"https://www.wikidata.org/wiki/Q909442","display_name":"KEGG","level":5,"score":0.8193983435630798},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6908634901046753},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5867945551872253},{"id":"https://openalex.org/C41584329","wikidata":"https://www.wikidata.org/wiki/Q175902","display_name":"Sequence database","level":3,"score":0.5094934105873108},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4946150481700897},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.48981139063835144},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.48528286814689636},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.473283976316452},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4127046763896942},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.3033648729324341},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.2714710235595703},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2380758821964264},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.18489250540733337},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.16558033227920532},{"id":"https://openalex.org/C2987395477","wikidata":"https://www.wikidata.org/wiki/Q135085","display_name":"Gene ontology","level":4,"score":0.08639472723007202},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0}],"mesh":[{"descriptor_ui":"D003628","descriptor_name":"Database Management Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003628","descriptor_name":"Database Management Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003628","descriptor_name":"Database Management Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003628","descriptor_name":"Database Management Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055162","descriptor_name":"Biocatalysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D055162","descriptor_name":"Biocatalysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D055162","descriptor_name":"Biocatalysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D055162","descriptor_name":"Biocatalysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":6,"locations":[{"id":"doi:10.1371/journal.pcbi.1000605","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1000605","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1000605&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS Computational Biology","raw_type":"journal-article"},{"id":"pmid:20011109","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/20011109","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS computational biology","raw_type":null},{"id":"pmh:oai:RePEc:plo:pcbi00:1000605","is_oa":false,"landing_page_url":"https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1000605","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},{"id":"pmh:oai:doaj.org/article:d399fec6c83b4f6a983821429be3ec92","is_oa":true,"landing_page_url":"https://doaj.org/article/d399fec6c83b4f6a983821429be3ec92","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, Vol 5, Iss 12, p e1000605 (2009)","raw_type":"article"},{"id":"pmh:oai:figshare.com:article/145406","is_oa":true,"landing_page_url":"https://figshare.com/articles/Annotation_Error_in_Public_Databases_Misannotation_of_Molecular_Function_in_Enzyme_Superfamilies/145406","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Dataset"},{"id":"pmh:oai:pubmedcentral.nih.gov:2781113","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2781113","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Comput Biol","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1371/journal.pcbi.1000605","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1000605","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1000605&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS Computational Biology","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5699999928474426,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"awards":[{"id":"https://openalex.org/G5990478676","display_name":null,"funder_award_id":"GM071790","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"},{"id":"https://openalex.org/G6894402473","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G874721465","display_name":null,"funder_award_id":"GM60595","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2060797027.pdf","grobid_xml":"https://content.openalex.org/works/W2060797027.grobid-xml"},"referenced_works_count":75,"referenced_works":["https://openalex.org/W130193107","https://openalex.org/W217834111","https://openalex.org/W1507593999","https://openalex.org/W1509280691","https://openalex.org/W1575826900","https://openalex.org/W1700503930","https://openalex.org/W1841334989","https://openalex.org/W1964640688","https://openalex.org/W1965144037","https://openalex.org/W1972314084","https://openalex.org/W1973626596","https://openalex.org/W1975914194","https://openalex.org/W1977027195","https://openalex.org/W1982481323","https://openalex.org/W1988818490","https://openalex.org/W1994441981","https://openalex.org/W1995047912","https://openalex.org/W1995117714","https://openalex.org/W1995413875","https://openalex.org/W1996351562","https://openalex.org/W2003788979","https://openalex.org/W2011025549","https://openalex.org/W2032838501","https://openalex.org/W2048947602","https://openalex.org/W2055033601","https://openalex.org/W2057387739","https://openalex.org/W2057885377","https://openalex.org/W2063597580","https://openalex.org/W2072854916","https://openalex.org/W2086803538","https://openalex.org/W2093407117","https://openalex.org/W2100320834","https://openalex.org/W2101641168","https://openalex.org/W2103017472","https://openalex.org/W2107251251","https://openalex.org/W2107424557","https://openalex.org/W2109615707","https://openalex.org/W2109715166","https://openalex.org/W2112492958","https://openalex.org/W2113561798","https://openalex.org/W2115595474","https://openalex.org/W2116258825","https://openalex.org/W2116423958","https://openalex.org/W2120423098","https://openalex.org/W2123060905","https://openalex.org/W2124200821","https://openalex.org/W2124410686","https://openalex.org/W2126178176","https://openalex.org/W2130406589","https://openalex.org/W2132926880","https://openalex.org/W2133787379","https://openalex.org/W2135152200","https://openalex.org/W2136514583","https://openalex.org/W2140377922","https://openalex.org/W2141885858","https://openalex.org/W2146188580","https://openalex.org/W2148130205","https://openalex.org/W2155606054","https://openalex.org/W2157142163","https://openalex.org/W2158714788","https://openalex.org/W2159675211","https://openalex.org/W2161062388","https://openalex.org/W2161794223","https://openalex.org/W2163105490","https://openalex.org/W2166745327","https://openalex.org/W2167455933","https://openalex.org/W2168909179","https://openalex.org/W2604823638","https://openalex.org/W2951726307","https://openalex.org/W2991064287","https://openalex.org/W4210323379","https://openalex.org/W4211000692","https://openalex.org/W4212865600","https://openalex.org/W4252706339","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2506632566","https://openalex.org/W2161189461","https://openalex.org/W2022667872","https://openalex.org/W4213149192","https://openalex.org/W2161062388","https://openalex.org/W2003144438","https://openalex.org/W2762751282","https://openalex.org/W1982597966","https://openalex.org/W2006673229","https://openalex.org/W1972394537"],"abstract_inverted_index":{"Due":[0],"to":[1,103,177,231],"the":[2,12,37,58,97,108,119,123,139,146,150,165,227],"rapid":[3],"release":[4],"of":[5,14,34,39,80,133,145,152,158,164,181,194,226,235],"new":[6],"data":[7],"from":[8,175],"genome":[9],"sequencing":[10],"projects,":[11],"majority":[13],"protein":[15,67,111,120],"sequences":[16,26,121],"in":[17,41,53,64,122,154,202],"public":[18,43,66],"databases":[19,44,69,113,160],"have":[20,49,56],"not":[21,50],"been":[22,51,218],"experimentally":[23],"characterized;":[24],"rather,":[25],"are":[27,45,221],"annotated":[28],"using":[29],"computational":[30],"analysis.":[31],"The":[32,91,179],"level":[33,151],"misannotation":[35,40,59,134,153,172,182,201],"and":[36,48,74,116,118,129],"types":[38,180],"large":[42],"currently":[46],"unknown":[47],"analyzed":[52],"depth.":[54],"We":[55],"investigated":[57],"levels":[60,101,132,234],"for":[61,76,84,105,223],"molecular":[62,195],"function":[63],"four":[65],"sequence":[68,112],"(UniProtKB/Swiss-Prot,":[70],"GenBank":[71],"NR,":[72],"UniProtKB/TrEMBL,":[73],"KEGG)":[75],"a":[77,213],"model":[78],"set":[79],"37":[81,147],"enzyme":[82,203],"families":[83,148,207],"which":[85],"extensive":[86],"experimental":[87],"information":[88],"is":[89,161,212],"available.":[90],"manually":[92],"curated":[93],"database":[94,126,167],"Swiss-Prot":[95],"shows":[96,170],"lowest":[98],"annotation":[99],"error":[100],"(close":[102],"0%":[104],"most":[106,190],"families);":[107],"two":[109],"other":[110],"(GenBank":[114],"NR":[115,166],"TrEMBL)":[117],"KEGG":[124],"pathways":[125],"exhibit":[127],"similar":[128],"surprisingly":[130],"high":[131,233],"that":[135,171,183,200,208],"average":[136],"5%-63%":[137],"across":[138],"six":[140],"superfamilies":[141,204],"studied.":[142],"For":[143],"10":[144],"examined,":[149],"one":[155],"or":[156],"more":[157],"these":[159,232],">80%.":[162],"Examination":[163],"over":[168],"time":[169],"has":[173,217],"increased":[174],"1993":[176],"2005.":[178],"were":[184],"found":[185],"fall":[186],"into":[187],"several":[188],"categories,":[189],"associated":[191],"with":[192],"\"overprediction\"":[193],"function.":[196],"These":[197],"results":[198],"suggest":[199],"containing":[205],"multiple":[206],"catalyze":[209],"different":[210],"reactions":[211],"larger":[214],"problem":[215],"than":[216],"recognized.":[219],"Strategies":[220],"suggested":[222],"addressing":[224],"some":[225],"systematic":[228],"problems":[229],"contributing":[230],"misannotation.":[236]},"counts_by_year":[{"year":2026,"cited_by_count":11},{"year":2025,"cited_by_count":28},{"year":2024,"cited_by_count":42},{"year":2023,"cited_by_count":28},{"year":2022,"cited_by_count":42},{"year":2021,"cited_by_count":32},{"year":2020,"cited_by_count":54},{"year":2019,"cited_by_count":56},{"year":2018,"cited_by_count":47},{"year":2017,"cited_by_count":62},{"year":2016,"cited_by_count":37},{"year":2015,"cited_by_count":42},{"year":2014,"cited_by_count":58},{"year":2013,"cited_by_count":61},{"year":2012,"cited_by_count":42}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
