{"id":"https://openalex.org/W4232697233","doi":"https://doi.org/10.1093/database/bat040","title":"The challenge of increasing Pfam coverage of the human proteome","display_name":"The challenge of increasing Pfam coverage of the human proteome","publication_year":2013,"publication_date":"2013-01-01","ids":{"openalex":"https://openalex.org/W4232697233","doi":"https://doi.org/10.1093/database/bat040"},"language":"en","primary_location":{"id":"doi:10.1093/database/bat040","is_oa":true,"landing_page_url":"https://doi.org/10.1093/database/bat040","pdf_url":null,"source":{"id":"https://openalex.org/S4210201630","display_name":"Database","issn_l":"1758-0463","issn":["1758-0463"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311647","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/P4310311647"],"host_organization_lineage_names":["University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1093/database/bat040","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024885643","display_name":"Jaina Mistry","orcid":"https://orcid.org/0000-0003-2479-5322"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jaina Mistry","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079459718","display_name":"Penny Coggill","orcid":null},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Penny Coggill","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040135675","display_name":"Ruth Y. Eberhardt","orcid":"https://orcid.org/0000-0001-6152-1369"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ruth Y. Eberhardt","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048095929","display_name":"Antonio Deiana","orcid":null},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Antonio Deiana","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090645044","display_name":"Andrea Giansanti","orcid":"https://orcid.org/0000-0002-8113-8188"},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrea Giansanti","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104045098","display_name":"ROBERT FINN","orcid":"https://orcid.org/0000-0001-8626-2148"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Robert D. Finn","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059430118","display_name":"Alex Bateman","orcid":null},"institutions":[{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]},{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alex Bateman","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056369160","display_name":"Marco Punta","orcid":"https://orcid.org/0000-0002-0050-0676"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I87048295","display_name":"Wellcome Trust","ror":"https://ror.org/029chgv08","country_code":"GB","type":"funder","lineage":["https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Marco Punta","raw_affiliation_strings":["EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA"],"affiliations":[{"raw_affiliation_string":"EMBL-European Bioinformatics Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SD, UK, 2Sanger Institute, Wellcome Trust Genome Campus, Hinxton, Cambridge, CB10 1SA, UK, 3Department of Physics, Sapienza University of Rome, P.le A. Moro 2, 00185 Rome, Italy, 4INFN, Sezione di Roma1, P.le A. Moro 5, 00185 Rome, Italy and 5HHMI Janelia Farm Research Campus, 19700 Helix Drive, Ashburn, VA 20147, USA","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5056369160"],"corresponding_institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I87048295"],"apc_list":{"value":1415,"currency":"GBP","value_usd":1735},"apc_paid":{"value":1415,"currency":"GBP","value_usd":1735},"fwci":0.5137,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65873689,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2013","issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/uniprot","display_name":"UniProt","score":0.9140512347221375},{"id":"https://openalex.org/keywords/human-proteome-project","display_name":"Human proteome project","score":0.7387772798538208},{"id":"https://openalex.org/keywords/proteome","display_name":"Proteome","score":0.7058287858963013},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5341129899024963},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.5206260085105896},{"id":"https://openalex.org/keywords/proteomics","display_name":"Proteomics","score":0.35653090476989746},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.30313214659690857},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.24623623490333557}],"concepts":[{"id":"https://openalex.org/C202264299","wikidata":"https://www.wikidata.org/wiki/Q905695","display_name":"UniProt","level":3,"score":0.9140512347221375},{"id":"https://openalex.org/C94795543","wikidata":"https://www.wikidata.org/wiki/Q3813754","display_name":"Human proteome project","level":4,"score":0.7387772798538208},{"id":"https://openalex.org/C104397665","wikidata":"https://www.wikidata.org/wiki/Q860947","display_name":"Proteome","level":2,"score":0.7058287858963013},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5341129899024963},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.5206260085105896},{"id":"https://openalex.org/C46111723","wikidata":"https://www.wikidata.org/wiki/Q471857","display_name":"Proteomics","level":3,"score":0.35653090476989746},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.30313214659690857},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.24623623490333557},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1093/database/bat040","is_oa":true,"landing_page_url":"https://doi.org/10.1093/database/bat040","pdf_url":null,"source":{"id":"https://openalex.org/S4210201630","display_name":"Database","issn_l":"1758-0463","issn":["1758-0463"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311647","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/P4310311647"],"host_organization_lineage_names":["University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database","raw_type":"journal-article"},{"id":"pmh:oai:europepmc.org:2668410","is_oa":false,"landing_page_url":"http://europepmc.org/articles/PMC3668385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},{"id":"pmh:oai:pubmedcentral.nih.gov:3668385","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3668385","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Database (Oxford)","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1093/database/bat040","is_oa":true,"landing_page_url":"https://doi.org/10.1093/database/bat040","pdf_url":null,"source":{"id":"https://openalex.org/S4210201630","display_name":"Database","issn_l":"1758-0463","issn":["1758-0463"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311647","host_organization_name":"University of Oxford","host_organization_lineage":["https://openalex.org/P4310311647"],"host_organization_lineage_names":["University of Oxford"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Database","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","score":0.47999998927116394,"display_name":"Life in Land"}],"awards":[{"id":"https://openalex.org/G6955215639","display_name":null,"funder_award_id":"BB/F010435/1","funder_id":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334629","display_name":"Biotechnology and Biological Sciences Research Council","ror":"https://ror.org/00cwqg982"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2288906059","https://openalex.org/W3092794487","https://openalex.org/W2093519416","https://openalex.org/W2094752534","https://openalex.org/W1982829397","https://openalex.org/W2885268310","https://openalex.org/W2106414650","https://openalex.org/W2347437365","https://openalex.org/W2025055488","https://openalex.org/W2296132555"],"abstract_inverted_index":{"It":[0],"is":[1],"a":[2,67,229,243],"worthy":[3],"goal":[4],"to":[5,84,119,144,184,200,203,256],"completely":[6],"characterize":[7],"all":[8],"human":[9,38,52,92,115,139,252],"proteins":[10,35,131],"in":[11,28,36,99,132,176,213],"terms":[12],"of":[13,34,44,90,113,146,159,165,179,195,250,260],"their":[14,233],"domains.":[15],"Here,":[16],"using":[17],"the":[18,37,91,114,133,138,168,220,251,258],"Pfam":[19,100,237,248],"database,":[20],"we":[21,25],"asked":[22],"how":[23],"far":[24],"have":[26,272],"progressed":[27],"this":[29],"endeavour.":[30],"Ninety":[31],"per":[32,163],"cent":[33,164],"proteome":[39,116,253],"matched":[40,171],"at":[41],"least":[42],"one":[43,221],"5494":[45],"manually":[46],"curated":[47],"Pfam-A":[48,56,190],"families.":[49,161,238,262],"In":[50],"contrast,":[51],"residue":[53],"coverage":[54,249],"by":[55],"families":[57,65,197,264],"was":[58,96,117],"<45%,":[59],"with":[60,106,130,188,223],"9418":[61],"automatically":[62],"generated":[63,202],"Pfam-B":[64],"adding":[66],"further":[68],"10%.":[69],"Even":[70],"after":[71],"excluding":[72],"predicted":[73],"signal":[74],"peptide":[75],"regions":[76,79,140,209],"and":[77,103],"short":[78],"(<50":[80],"consecutive":[81],"residues)":[82],"unlikely":[83],"harbour":[85],"new":[86,196,236],"families,":[87,191],"for":[88,246],"\u223c38%":[89],"protein":[93,108,127],"residues,":[94],"there":[95],"no":[97],"information":[98],"about":[101],"conservation":[102],"evolutionary":[104],"relationship":[105,187],"other":[107,147,169],"regions.":[109,128],"This":[110,226],"uncovered":[111],"portion":[112],"found":[118],"be":[120,201,255,267],"distributed":[121],"over":[122],"almost":[123],"25":[124],"000":[125],"distinct":[126],"Comparison":[129],"UniProtKB":[134],"database":[135],"suggested":[136],"that":[137,141,193,271],"exhibited":[142],"similarity":[143],"thousands":[145,194],"sequences":[148,175],"were":[149,210],"often":[150],"either":[151],"divergent":[152],"elements":[153],"or":[154,156],"N-":[155],"C-terminal":[157],"extensions":[158],"existing":[160,189,261],"Thirty-four":[162],"regions,":[166],"on":[167,240],"hand,":[170],"fewer":[172],"than":[173],"100":[174],"UniProtKB.":[177],"Most":[178],"these":[180,207,241],"did":[181],"not":[182],"appear":[183],"share":[185],"any":[186],"suggesting":[192],"would":[198],"need":[199],"cover":[204],"them.":[205],"Also,":[206],"latter":[208],"particularly":[211],"rich":[212],"amino":[214],"acid":[215],"compositional":[216],"bias":[217],"such":[218],"as":[219],"associated":[222],"intrinsic":[224],"disorder.":[225],"could":[227],"represent":[228],"significant":[230],"obstacle":[231],"toward":[232],"inclusion":[234],"into":[235],"Based":[239],"observations,":[242],"major":[244],"focus":[245],"increasing":[247],"will":[254,265],"improve":[257],"definition":[259],"New":[263],"also":[266],"built,":[268],"prioritizing":[269],"those":[270],"been":[273],"experimentally":[274],"functionally":[275],"characterized.":[276],"Database":[277],"URL:":[278],"http://pfam.sanger.ac.uk/":[279]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
