{"id":"https://openalex.org/W2014097763","doi":"https://doi.org/10.1186/1471-2105-13-264","title":"Sifting through genomes with iterative-sequence clustering produces a large, phylogenetically diverse protein-family resource","display_name":"Sifting through genomes with iterative-sequence clustering produces a large, phylogenetically diverse protein-family resource","publication_year":2012,"publication_date":"2012-10-13","ids":{"openalex":"https://openalex.org/W2014097763","doi":"https://doi.org/10.1186/1471-2105-13-264","mag":"2014097763","pmid":"https://pubmed.ncbi.nlm.nih.gov/23061897"},"language":"en","primary_location":{"id":"doi:10.1186/1471-2105-13-264","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-13-264","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-264","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-264","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076795528","display_name":"Thomas J. Sharpton","orcid":"https://orcid.org/0000-0002-5996-7764"},"institutions":[{"id":"https://openalex.org/I180670191","display_name":"University of California, San Francisco","ror":"https://ror.org/043mz5j54","country_code":"US","type":"education","lineage":["https://openalex.org/I180670191"]},{"id":"https://openalex.org/I1321430492","display_name":"Gladstone Institutes","ror":"https://ror.org/038321296","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1321430492"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Thomas J Sharpton","raw_affiliation_strings":["The J. David Gladstone Institutes, University of California San Francisco, San Francisco, CA 94158, USA. thomas.sharpton@gladstone.ucsf.edu","The J. David Gladstone Institutes, University of California San Francisco, San Francisco, CA, 94158, USA"],"affiliations":[{"raw_affiliation_string":"The J. David Gladstone Institutes, University of California San Francisco, San Francisco, CA 94158, USA. thomas.sharpton@gladstone.ucsf.edu","institution_ids":["https://openalex.org/I1321430492"]},{"raw_affiliation_string":"The J. David Gladstone Institutes, University of California San Francisco, San Francisco, CA, 94158, USA","institution_ids":["https://openalex.org/I1321430492","https://openalex.org/I180670191"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086222406","display_name":"Guillaume Jospin","orcid":"https://orcid.org/0000-0002-8746-2632"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guillaume Jospin","raw_affiliation_strings":["UC Davis Genome Center, University of California, Davis, Davis, CA, 95616, USA"],"affiliations":[{"raw_affiliation_string":"UC Davis Genome Center, University of California, Davis, Davis, CA, 95616, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043047513","display_name":"Dongying Wu","orcid":"https://orcid.org/0000-0002-4167-2212"},"institutions":[{"id":"https://openalex.org/I196679689","display_name":"Joint Genome Institute","ror":"https://ror.org/04xm1d337","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I196679689","https://openalex.org/I39565521"]},{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dongying Wu","raw_affiliation_strings":["Department of Energy Joint Genome Institute, Walnut Creek, CA, 94598, USA","UC Davis Genome Center, University of California, Davis, Davis, CA, 95616, USA"],"affiliations":[{"raw_affiliation_string":"Department of Energy Joint Genome Institute, Walnut Creek, CA, 94598, USA","institution_ids":["https://openalex.org/I196679689"]},{"raw_affiliation_string":"UC Davis Genome Center, University of California, Davis, Davis, CA, 95616, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061354858","display_name":"Morgan G. I. Langille","orcid":"https://orcid.org/0000-0002-6604-3009"},"institutions":[{"id":"https://openalex.org/I129902397","display_name":"Dalhousie University","ror":"https://ror.org/01e6qks80","country_code":"CA","type":"education","lineage":["https://openalex.org/I129902397"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Morgan GI Langille","raw_affiliation_strings":["Department of Biochemistry & Molecular Biology, Dalhousie University, Halifax, Nova Scotia, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Biochemistry & Molecular Biology, Dalhousie University, Halifax, Nova Scotia, Canada","institution_ids":["https://openalex.org/I129902397"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005062415","display_name":"Katherine S. Pollard","orcid":"https://orcid.org/0000-0002-9870-6196"},"institutions":[{"id":"https://openalex.org/I180670191","display_name":"University of California, San Francisco","ror":"https://ror.org/043mz5j54","country_code":"US","type":"education","lineage":["https://openalex.org/I180670191"]},{"id":"https://openalex.org/I1321430492","display_name":"Gladstone Institutes","ror":"https://ror.org/038321296","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1321430492"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Katherine S Pollard","raw_affiliation_strings":["Department of Epidemiology & Biostatistics, Institute for Human Genetics, University of California San Francisco, San Francisco, CA, 94158, USA","The J. David Gladstone Institutes, University of California San Francisco, San Francisco, CA, 94158, USA"],"affiliations":[{"raw_affiliation_string":"Department of Epidemiology & Biostatistics, Institute for Human Genetics, University of California San Francisco, San Francisco, CA, 94158, USA","institution_ids":["https://openalex.org/I180670191"]},{"raw_affiliation_string":"The J. David Gladstone Institutes, University of California San Francisco, San Francisco, CA, 94158, USA","institution_ids":["https://openalex.org/I1321430492","https://openalex.org/I180670191"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059066311","display_name":"Jonathan A. Eisen","orcid":"https://orcid.org/0000-0002-0159-2197"},"institutions":[{"id":"https://openalex.org/I4210160527","display_name":"University of California Davis Medical Center","ror":"https://ror.org/05t6gpm70","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210160527","https://openalex.org/I4210160856"]},{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]},{"id":"https://openalex.org/I196679689","display_name":"Joint Genome Institute","ror":"https://ror.org/04xm1d337","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I196679689","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan A Eisen","raw_affiliation_strings":["Department of Energy Joint Genome Institute, Walnut Creek, CA, 94598, USA","Deptartment of Evolution and Ecology, University of California, Davis, Davis, CA, 95616, USA","Deptartment of Medical Microbiology and Immunology, University of California, Davis, Davis, CA, 95616, USA","UC Davis Genome Center, University of California, Davis, Davis, CA, 95616, USA"],"affiliations":[{"raw_affiliation_string":"Department of Energy Joint Genome Institute, Walnut Creek, CA, 94598, USA","institution_ids":["https://openalex.org/I196679689"]},{"raw_affiliation_string":"Deptartment of Evolution and Ecology, University of California, Davis, Davis, CA, 95616, USA","institution_ids":["https://openalex.org/I84218800"]},{"raw_affiliation_string":"Deptartment of Medical Microbiology and Immunology, University of California, Davis, Davis, CA, 95616, USA","institution_ids":["https://openalex.org/I4210160527","https://openalex.org/I84218800"]},{"raw_affiliation_string":"UC Davis Genome Center, University of California, Davis, Davis, CA, 95616, USA","institution_ids":["https://openalex.org/I84218800"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5076795528"],"corresponding_institution_ids":["https://openalex.org/I1321430492","https://openalex.org/I180670191"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":1.2102,"has_fulltext":true,"cited_by_count":23,"citation_normalized_percentile":{"value":0.77505896,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"13","issue":"1","first_page":"264","last_page":"264"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10012","display_name":"Genetic diversity and population structure","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.672988772392273},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5804124474525452},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5549980998039246},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5509502291679382},{"id":"https://openalex.org/keywords/protein-family","display_name":"Protein family","score":0.5269055366516113},{"id":"https://openalex.org/keywords/phylogenetic-tree","display_name":"Phylogenetic tree","score":0.453596293926239},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4488707184791565},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.44824913144111633},{"id":"https://openalex.org/keywords/genomics","display_name":"Genomics","score":0.4448775351047516},{"id":"https://openalex.org/keywords/comparative-genomics","display_name":"Comparative genomics","score":0.4382193088531494},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.4286021590232849},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.34852907061576843},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.19913941621780396},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.14256826043128967},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.13796457648277283}],"concepts":[{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.672988772392273},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5804124474525452},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5549980998039246},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5509502291679382},{"id":"https://openalex.org/C171897839","wikidata":"https://www.wikidata.org/wiki/Q417841","display_name":"Protein family","level":3,"score":0.5269055366516113},{"id":"https://openalex.org/C193252679","wikidata":"https://www.wikidata.org/wiki/Q242125","display_name":"Phylogenetic tree","level":3,"score":0.453596293926239},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4488707184791565},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.44824913144111633},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.4448775351047516},{"id":"https://openalex.org/C105176652","wikidata":"https://www.wikidata.org/wiki/Q1147112","display_name":"Comparative genomics","level":5,"score":0.4382193088531494},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.4286021590232849},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.34852907061576843},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.19913941621780396},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.14256826043128967},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.13796457648277283},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D010802","descriptor_name":"Phylogeny","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D010802","descriptor_name":"Phylogeny","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D010802","descriptor_name":"Phylogeny","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D058977","descriptor_name":"Molecular Sequence Annotation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D058977","descriptor_name":"Molecular Sequence Annotation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D058977","descriptor_name":"Molecular Sequence Annotation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":6,"locations":[{"id":"doi:10.1186/1471-2105-13-264","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-13-264","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-264","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:23061897","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/23061897","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:f45c61462668426eb94184e4386985ff","is_oa":true,"landing_page_url":"https://doaj.org/article/f45c61462668426eb94184e4386985ff","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 13, Iss 1, p 264 (2012)","raw_type":"article"},{"id":"pmh:oai:escholarship.org/ark:/13030/qt3gc843kb","is_oa":false,"landing_page_url":"https://escholarship.org/uc/item/3gc843kb","pdf_url":null,"source":{"id":"https://openalex.org/S4306400115","display_name":"eScholarship (California Digital Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2801248553","host_organization_name":"California Digital Library","host_organization_lineage":["https://openalex.org/I2801248553"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, vol 13, iss 1","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:3481395","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3481395","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"},{"id":"pmh:qt3gc843kb","is_oa":false,"landing_page_url":"http://www.escholarship.org/uc/item/3gc843kb","pdf_url":null,"source":{"id":"https://openalex.org/S4306400115","display_name":"eScholarship (California Digital Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2801248553","host_organization_name":"California Digital Library","host_organization_lineage":["https://openalex.org/I2801248553"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Sharpton, Thomas J; Jospin, Guillaume; Wu, Dongying; Langille, Morgan GI; Pollard, Katherine S; &amp; Eisen, Jonathan A. (2012). Sifting through genomes with iterative-sequence clustering produces a large, phylogenetically diverse protein-family resource. BMC Bioinformatics, 13(1), 264. doi: http://dx.doi.org/10.1186/1471-2105-13-264. Retrieved from: http://www.escholarship.org/uc/item/3gc843kb","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/1471-2105-13-264","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-13-264","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-264","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3747166797","display_name":"Exploring the Niche Space of Human Microbiome Functions through Convex Geometry and Evolutionary Genomics","funder_award_id":"1069303","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5533717888","display_name":null,"funder_award_id":"DMS-1069303","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7340972926","display_name":null,"funder_award_id":"other","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G782520783","display_name":null,"funder_award_id":"#3300","funder_id":"https://openalex.org/F4320306202","funder_display_name":"Gordon and Betty Moore Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320306202","display_name":"Gordon and Betty Moore Foundation","ror":"https://ror.org/006wxqw41"},{"id":"https://openalex.org/F4320316170","display_name":"Joint Genome Institute","ror":"https://ror.org/04xm1d337"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2014097763.pdf","grobid_xml":"https://content.openalex.org/works/W2014097763.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W181377306","https://openalex.org/W229097380","https://openalex.org/W1791999417","https://openalex.org/W1966952999","https://openalex.org/W1975970608","https://openalex.org/W1990453950","https://openalex.org/W2017608260","https://openalex.org/W2019216543","https://openalex.org/W2031611770","https://openalex.org/W2045765967","https://openalex.org/W2052316443","https://openalex.org/W2055043387","https://openalex.org/W2091232725","https://openalex.org/W2097107919","https://openalex.org/W2097485877","https://openalex.org/W2111211467","https://openalex.org/W2111373249","https://openalex.org/W2119027485","https://openalex.org/W2122613768","https://openalex.org/W2124166542","https://openalex.org/W2124410686","https://openalex.org/W2132926880","https://openalex.org/W2134819521","https://openalex.org/W2138122982","https://openalex.org/W2141885858","https://openalex.org/W2150550043","https://openalex.org/W2159482845","https://openalex.org/W2161062388","https://openalex.org/W2161762698","https://openalex.org/W2163500926","https://openalex.org/W2166705366","https://openalex.org/W2169900015","https://openalex.org/W2741071058","https://openalex.org/W4294216483","https://openalex.org/W4320301318"],"related_works":["https://openalex.org/W1565527690","https://openalex.org/W1493660383","https://openalex.org/W2759519215","https://openalex.org/W4318240630","https://openalex.org/W2353729507","https://openalex.org/W2350466590","https://openalex.org/W1542620732","https://openalex.org/W3031625301","https://openalex.org/W4386771068","https://openalex.org/W2080758876"],"abstract_inverted_index":{"We":[0],"describe":[1],"the":[2],"rapid":[3],"identification":[4],"of":[5],"SFams":[6],"and":[7,17,32,38,43],"demonstrate":[8],"how":[9],"they":[10],"can":[11],"be":[12,45],"used":[13],"to":[14,47],"annotate":[15],"genomes":[16],"metagenomes.":[18],"The":[19],"SFam":[20],"database":[21,39],"catalogs":[22],"protein-family":[23],"quality":[24],"metrics,":[25],"multiple":[26],"sequence":[27],"alignments,":[28],"hidden":[29],"Markov":[30],"models,":[31],"phylogenetic":[33],"trees.":[34],"Our":[35],"source":[36],"code":[37],"are":[40],"publicly":[41],"available":[42],"will":[44],"subject":[46],"frequent":[48],"updates":[49],"(http://edhar.genomecenter.ucdavis.edu/sifting_families/).":[50]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
