{"id":"https://openalex.org/W2161880345","doi":"https://doi.org/10.1093/database/bat023","title":"The challenge of increasing Pfam coverage of the human proteome","display_name":"The challenge of increasing Pfam coverage of the human proteome","publication_year":2013,"publication_date":"2013-01-01","ids":{"openalex":"https://openalex.org/W2161880345","doi":"https://doi.org/10.1093/database/bat023","mag":"2161880345","pmid":"https://pubmed.ncbi.nlm.nih.gov/23603847"},"language":"en","primary_location":{"id":"doi:10.1093/database/bat023","is_oa":true,"landing_page_url":"https://doi.org/10.1093/database/bat023","pdf_url":"https://academic.oup.com/database/article-pdf/doi/10.1093/database/bat023/11196772/bat023.pdf","source":{"id":"https://openalex.org/S4210201630","display_name":"Database","issn_l":"1758-0463","issn":["1758-0463"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311647","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/P4310311647"],"host_organization_lineage_names":["University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://academic.oup.com/database/article-pdf/doi/10.1093/database/bat023/11196772/bat023.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024885643","display_name":"Jaina Mistry","orcid":"https://orcid.org/0000-0003-2479-5322"},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Jaina Mistry","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079459718","display_name":"Penny Coggill","orcid":null},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Penny Coggill","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040135675","display_name":"Ruth Y. Eberhardt","orcid":"https://orcid.org/0000-0001-6152-1369"},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ruth Y. Eberhardt","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048095929","display_name":"Antonio Deiana","orcid":null},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Antonio Deiana","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090645044","display_name":"Andrea Giansanti","orcid":"https://orcid.org/0000-0002-8113-8188"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrea Giansanti","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104045098","display_name":"ROBERT FINN","orcid":"https://orcid.org/0000-0001-8626-2148"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Robert D. Finn","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059430118","display_name":"Alex Bateman","orcid":null},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alex Bateman","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056369160","display_name":"Marco Punta","orcid":"https://orcid.org/0000-0002-0050-0676"},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Marco Punta","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5024885643"],"corresponding_institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"],"apc_list":{"value":1415,"currency":"GBP","value_usd":1735},"apc_paid":{"value":1415,"currency":"GBP","value_usd":1735},"fwci":1.8832,"has_fulltext":true,"cited_by_count":31,"citation_normalized_percentile":{"value":0.84044301,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"2013","issue":null,"first_page":"bat023","last_page":"bat023"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/uniprot","display_name":"UniProt","score":0.9073106050491333},{"id":"https://openalex.org/keywords/human-proteome-project","display_name":"Human proteome project","score":0.7410255670547485},{"id":"https://openalex.org/keywords/proteome","display_name":"Proteome","score":0.6985630393028259},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5267757177352905},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.5156668424606323},{"id":"https://openalex.org/keywords/proteomics","display_name":"Proteomics","score":0.33272844552993774},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.2921689450740814},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.24397563934326172}],"concepts":[{"id":"https://openalex.org/C202264299","wikidata":"https://www.wikidata.org/wiki/Q905695","display_name":"UniProt","level":3,"score":0.9073106050491333},{"id":"https://openalex.org/C94795543","wikidata":"https://www.wikidata.org/wiki/Q3813754","display_name":"Human proteome project","level":4,"score":0.7410255670547485},{"id":"https://openalex.org/C104397665","wikidata":"https://www.wikidata.org/wiki/Q860947","display_name":"Proteome","level":2,"score":0.6985630393028259},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5267757177352905},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.5156668424606323},{"id":"https://openalex.org/C46111723","wikidata":"https://www.wikidata.org/wiki/Q471857","display_name":"Proteomics","level":3,"score":0.33272844552993774},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.2921689450740814},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.24397563934326172},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D004926","descriptor_name":"Escherichia coli","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004926","descriptor_name":"Escherichia coli","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004926","descriptor_name":"Escherichia coli","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D004926","descriptor_name":"Escherichia coli","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012441","descriptor_name":"Saccharomyces cerevisiae","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012441","descriptor_name":"Saccharomyces cerevisiae","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012441","descriptor_name":"Saccharomyces cerevisiae","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012441","descriptor_name":"Saccharomyces cerevisiae","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017434","descriptor_name":"Protein Structure, Tertiary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017434","descriptor_name":"Protein Structure, Tertiary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017434","descriptor_name":"Protein Structure, Tertiary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017434","descriptor_name":"Protein Structure, Tertiary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020543","descriptor_name":"Proteome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020543","descriptor_name":"Proteome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020543","descriptor_name":"Proteome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020543","descriptor_name":"Proteome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":4,"locations":[{"id":"doi:10.1093/database/bat023","is_oa":true,"landing_page_url":"https://doi.org/10.1093/database/bat023","pdf_url":"https://academic.oup.com/database/article-pdf/doi/10.1093/database/bat023/11196772/bat023.pdf","source":{"id":"https://openalex.org/S4210201630","display_name":"Database","issn_l":"1758-0463","issn":["1758-0463"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311647","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/P4310311647"],"host_organization_lineage_names":["University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database","raw_type":"journal-article"},{"id":"pmid:23603847","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/23603847","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database : the journal of biological databases and curation","raw_type":null},{"id":"pmh:oai:europepmc.org:2628430","is_oa":false,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3630804","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"},{"id":"pmh:oai:iris.uniroma1.it:11573/515923","is_oa":false,"landing_page_url":"http://hdl.handle.net/11573/515923","pdf_url":null,"source":{"id":"https://openalex.org/S4377196107","display_name":"IRIS Research product catalog (Sapienza University of Rome)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1093/database/bat023","is_oa":true,"landing_page_url":"https://doi.org/10.1093/database/bat023","pdf_url":"https://academic.oup.com/database/article-pdf/doi/10.1093/database/bat023/11196772/bat023.pdf","source":{"id":"https://openalex.org/S4210201630","display_name":"Database","issn_l":"1758-0463","issn":["1758-0463"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311647","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/P4310311647"],"host_organization_lineage_names":["University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.47999998927116394,"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land"}],"awards":[{"id":"https://openalex.org/G6955215639","display_name":null,"funder_award_id":"BB/F010435/1","funder_id":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council"},{"id":"https://openalex.org/G8039298099","display_name":"Embracing new technologies to streamline improve and sustain InterPro and its contributing databases","funder_award_id":"BB/F010435/1","funder_id":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320311904","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08"},{"id":"https://openalex.org/F4320320360","display_name":"University of Bristol","ror":"https://ror.org/0524sp257"},{"id":"https://openalex.org/F4320334629","display_name":"Biotechnology and Biological Sciences Research Council","ror":"https://ror.org/00cwqg982"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2161880345.pdf","grobid_xml":"https://content.openalex.org/works/W2161880345.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1513332069","https://openalex.org/W1578400757","https://openalex.org/W1892578325","https://openalex.org/W1968697272","https://openalex.org/W1971147414","https://openalex.org/W1971943180","https://openalex.org/W1991906934","https://openalex.org/W1998112339","https://openalex.org/W2013743057","https://openalex.org/W2022366078","https://openalex.org/W2026271132","https://openalex.org/W2051119339","https://openalex.org/W2057071212","https://openalex.org/W2059324308","https://openalex.org/W2070496155","https://openalex.org/W2085656056","https://openalex.org/W2092754163","https://openalex.org/W2096096221","https://openalex.org/W2099946731","https://openalex.org/W2102221598","https://openalex.org/W2107040871","https://openalex.org/W2107644675","https://openalex.org/W2110976912","https://openalex.org/W2124166542","https://openalex.org/W2128653811","https://openalex.org/W2132720084","https://openalex.org/W2134024910","https://openalex.org/W2139915240","https://openalex.org/W2141885858","https://openalex.org/W2144252381","https://openalex.org/W2146637813","https://openalex.org/W2158133029","https://openalex.org/W2161199282","https://openalex.org/W2163603537","https://openalex.org/W2168909179","https://openalex.org/W2170563234","https://openalex.org/W2259938310","https://openalex.org/W2519244818","https://openalex.org/W4210623056","https://openalex.org/W4320301318"],"related_works":["https://openalex.org/W2730490632","https://openalex.org/W2090672107","https://openalex.org/W1975345997","https://openalex.org/W1578833252","https://openalex.org/W4306353170","https://openalex.org/W2055310317","https://openalex.org/W267074739","https://openalex.org/W3157596112","https://openalex.org/W3195891740","https://openalex.org/W2885660763"],"abstract_inverted_index":{"It":[0],"is":[1],"a":[2,67,229,243],"worthy":[3],"goal":[4],"to":[5,84,119,144,184,200,203,256],"completely":[6],"characterize":[7],"all":[8],"human":[9,38,52,92,115,139,252],"proteins":[10,35,131],"in":[11,28,36,99,132,176,213],"terms":[12],"of":[13,34,44,90,113,146,159,165,179,195,250,260],"their":[14,233],"domains.":[15],"Here,":[16],"using":[17],"the":[18,37,91,114,133,138,168,220,251,258],"Pfam":[19,100,237,248],"database,":[20],"we":[21,25],"asked":[22],"how":[23],"far":[24],"have":[26,272],"progressed":[27],"this":[29],"endeavour.":[30],"Ninety":[31],"per":[32,163],"cent":[33,164],"proteome":[39,116,253],"matched":[40,171],"at":[41],"least":[42],"one":[43,221],"5494":[45],"manually":[46],"curated":[47],"Pfam-A":[48,56,190],"families.":[49,161,238,262],"In":[50],"contrast,":[51],"residue":[53],"coverage":[54,249],"by":[55],"families":[57,65,197,264],"was":[58,96,117],"<45%,":[59],"with":[60,106,130,188,223],"9418":[61],"automatically":[62],"generated":[63,202],"Pfam-B":[64],"adding":[66],"further":[68],"10%.":[69],"Even":[70],"after":[71],"excluding":[72],"predicted":[73],"signal":[74],"peptide":[75],"regions":[76,79,140,209],"and":[77,103],"short":[78],"(<50":[80],"consecutive":[81],"residues)":[82],"unlikely":[83],"harbour":[85],"new":[86,196,236],"families,":[87,191],"for":[88,246],"\u223c38%":[89],"protein":[93,108,127],"residues,":[94],"there":[95],"no":[97],"information":[98],"about":[101],"conservation":[102],"evolutionary":[104],"relationship":[105,187],"other":[107,147,169],"regions.":[109,128],"This":[110,226],"uncovered":[111],"portion":[112],"found":[118],"be":[120,201,255,267],"distributed":[121],"over":[122],"almost":[123],"25":[124],"000":[125],"distinct":[126],"Comparison":[129],"UniProtKB":[134],"database":[135],"suggested":[136],"that":[137,141,193,271],"exhibited":[142],"similarity":[143],"thousands":[145,194],"sequences":[148,175],"were":[149,210],"often":[150],"either":[151],"divergent":[152],"elements":[153],"or":[154,156],"N-":[155],"C-terminal":[157],"extensions":[158],"existing":[160,189,261],"Thirty-four":[162],"regions,":[166],"on":[167,240],"hand,":[170],"fewer":[172],"than":[173],"100":[174],"UniProtKB.":[177],"Most":[178],"these":[180,207,241],"did":[181],"not":[182],"appear":[183],"share":[185],"any":[186],"suggesting":[192],"would":[198],"need":[199],"cover":[204],"them.":[205],"Also,":[206],"latter":[208],"particularly":[211],"rich":[212],"amino":[214],"acid":[215],"compositional":[216],"bias":[217],"such":[218],"as":[219],"associated":[222],"intrinsic":[224],"disorder.":[225],"could":[227],"represent":[228],"significant":[230],"obstacle":[231],"toward":[232],"inclusion":[234],"into":[235],"Based":[239],"observations,":[242],"major":[244],"focus":[245],"increasing":[247],"will":[254,265],"improve":[257],"definition":[259],"New":[263],"also":[266],"built,":[268],"prioritizing":[269],"those":[270],"been":[273],"experimentally":[274],"functionally":[275],"characterized.":[276],"Database":[277],"URL:":[278],"http://pfam.sanger.ac.uk/":[279]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
