{"id":"https://openalex.org/W2620103645","doi":"https://doi.org/10.1186/s12859-017-1668-y","title":"In silico approach to designing rational metagenomic libraries for functional studies","display_name":"In silico approach to designing rational metagenomic libraries for functional studies","publication_year":2017,"publication_date":"2017-05-22","ids":{"openalex":"https://openalex.org/W2620103645","doi":"https://doi.org/10.1186/s12859-017-1668-y","mag":"2620103645","pmid":"https://pubmed.ncbi.nlm.nih.gov/28532384"},"language":"en","primary_location":{"id":"doi:10.1186/s12859-017-1668-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-017-1668-y","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/s12859-017-1668-y","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/s12859-017-1668-y","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036598163","display_name":"Anna Kusnezowa","orcid":null},"institutions":[{"id":"https://openalex.org/I904495901","display_name":"Ruhr University Bochum","ror":"https://ror.org/04tsk2644","country_code":"DE","type":"education","lineage":["https://openalex.org/I904495901"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Anna Kusnezowa","raw_affiliation_strings":["Institute of Biochemistry and Pathobiochemistry - Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany","Institute of Biochemistry and Pathobiochemistry \u2013 Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Biochemistry and Pathobiochemistry - Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany","institution_ids":[]},{"raw_affiliation_string":"Institute of Biochemistry and Pathobiochemistry \u2013 Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany","institution_ids":["https://openalex.org/I904495901"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003029797","display_name":"Lars I. Leichert","orcid":"https://orcid.org/0000-0002-5666-9681"},"institutions":[{"id":"https://openalex.org/I904495901","display_name":"Ruhr University Bochum","ror":"https://ror.org/04tsk2644","country_code":"DE","type":"education","lineage":["https://openalex.org/I904495901"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lars I. Leichert","raw_affiliation_strings":["Institute of Biochemistry and Pathobiochemistry - Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany. lars.leichert@ruhr-uni-bochum.de","Institute of Biochemistry and Pathobiochemistry \u2013 Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Biochemistry and Pathobiochemistry - Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany. lars.leichert@ruhr-uni-bochum.de","institution_ids":[]},{"raw_affiliation_string":"Institute of Biochemistry and Pathobiochemistry \u2013 Microbial Biochemistry, Ruhr University Bochum, Universit\u00e4tsstr. 150, 44780, Bochum, Germany","institution_ids":["https://openalex.org/I904495901"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5036598163"],"corresponding_institution_ids":["https://openalex.org/I904495901"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1661,"currency":"EUR","value_usd":1791},"fwci":0.3365,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.59776969,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"18","issue":"1","first_page":"267","last_page":"267"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.2904999852180481,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.2904999852180481,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11642","display_name":"Genomics and Rare Diseases","score":0.22679999470710754,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.0737999975681305,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metagenomics","display_name":"Metagenomics","score":0.8120927214622498},{"id":"https://openalex.org/keywords/in-silico","display_name":"In silico","score":0.7552490234375},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.6873784065246582},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.6205569505691528},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.5584375262260437},{"id":"https://openalex.org/keywords/homology","display_name":"Homology (biology)","score":0.5212008357048035},{"id":"https://openalex.org/keywords/protein-function-prediction","display_name":"Protein function prediction","score":0.45065850019454956},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.43214553594589233},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.4176161289215088},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.41212669014930725},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.3839857280254364},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.3398614525794983},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3328087329864502},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.2925668954849243},{"id":"https://openalex.org/keywords/protein-function","display_name":"Protein function","score":0.2739065885543823},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.16524434089660645},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.15608641505241394}],"concepts":[{"id":"https://openalex.org/C15151743","wikidata":"https://www.wikidata.org/wiki/Q903778","display_name":"Metagenomics","level":3,"score":0.8120927214622498},{"id":"https://openalex.org/C2775905019","wikidata":"https://www.wikidata.org/wiki/Q192572","display_name":"In silico","level":3,"score":0.7552490234375},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.6873784065246582},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.6205569505691528},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.5584375262260437},{"id":"https://openalex.org/C165525559","wikidata":"https://www.wikidata.org/wiki/Q224180","display_name":"Homology (biology)","level":3,"score":0.5212008357048035},{"id":"https://openalex.org/C207060522","wikidata":"https://www.wikidata.org/wiki/Q7251473","display_name":"Protein function prediction","level":4,"score":0.45065850019454956},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.43214553594589233},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.4176161289215088},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.41212669014930725},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.3839857280254364},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.3398614525794983},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3328087329864502},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.2925668954849243},{"id":"https://openalex.org/C2986374874","wikidata":"https://www.wikidata.org/wiki/Q8054","display_name":"Protein function","level":3,"score":0.2739065885543823},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.16524434089660645},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.15608641505241394}],"mesh":[{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001419","descriptor_name":"Bacteria","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D001419","descriptor_name":"Bacteria","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D001419","descriptor_name":"Bacteria","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008066","descriptor_name":"Lipolysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008066","descriptor_name":"Lipolysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008066","descriptor_name":"Lipolysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009792","descriptor_name":"Oceans and Seas","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009792","descriptor_name":"Oceans and Seas","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009792","descriptor_name":"Oceans and Seas","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D015723","descriptor_name":"Gene Library","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015723","descriptor_name":"Gene Library","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015723","descriptor_name":"Gene Library","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D054892","descriptor_name":"Metagenome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D054892","descriptor_name":"Metagenome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D054892","descriptor_name":"Metagenome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D056186","descriptor_name":"Metagenomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D056186","descriptor_name":"Metagenomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D056186","descriptor_name":"Metagenomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":5,"locations":[{"id":"doi:10.1186/s12859-017-1668-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-017-1668-y","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/s12859-017-1668-y","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:28532384","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/28532384","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:5e541417706a4fe89b2d5de7ee371fd6","is_oa":true,"landing_page_url":"https://doaj.org/article/5e541417706a4fe89b2d5de7ee371fd6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 18, Iss 1, Pp 1-11 (2017)","raw_type":"article"},{"id":"pmh:oai:europepmc.org:4291834","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/5441078","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"},{"id":"pmh:oai:hss-opus.ub.ruhr-uni-bochum.de:5896","is_oa":true,"landing_page_url":"https://nbn-resolving.org/urn:nbn:de:hbz:294-58968","pdf_url":null,"source":{"id":"https://openalex.org/S4306400167","display_name":"Dokumentenrepositorium der RUB (Ruhr University Bochum)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I904495901","host_organization_name":"Ruhr University Bochum","host_organization_lineage":["https://openalex.org/I904495901"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"doc-type:article"}],"best_oa_location":{"id":"doi:10.1186/s12859-017-1668-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-017-1668-y","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/s12859-017-1668-y","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Life below water","score":0.8799999952316284,"id":"https://metadata.un.org/sdg/14"}],"awards":[{"id":"https://openalex.org/G1423456925","display_name":null,"funder_award_id":"A 534A","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G1564535905","display_name":null,"funder_award_id":"FKZ 031","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G227648021","display_name":null,"funder_award_id":"031 A 534A","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G3202512810","display_name":null,"funder_award_id":"FKZ 031 A 534A","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G4727763261","display_name":"Functional Metagenomics \u2013 Harnessing the Biotechnological Potential of Completely Novel Protein Families","funder_award_id":"281384","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G5593277320","display_name":null,"funder_award_id":"2007-2013","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8382178641","display_name":null,"funder_award_id":"281384\u2013FuMe","funder_id":"https://openalex.org/F4320334678","funder_display_name":"European Research Council"},{"id":"https://openalex.org/G8842930235","display_name":null,"funder_award_id":"FKZ 031 A","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G892962579","display_name":null,"funder_award_id":"FKZ 031 A 534A","funder_id":"https://openalex.org/F4320330124","funder_display_name":"German Network for Bioinformatics Infrastructure"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"},{"id":"https://openalex.org/F4320330124","display_name":"German Network for Bioinformatics Infrastructure","ror":null},{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2620103645.pdf","grobid_xml":"https://content.openalex.org/works/W2620103645.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W97059505","https://openalex.org/W801829339","https://openalex.org/W1519266993","https://openalex.org/W1762307288","https://openalex.org/W1791999417","https://openalex.org/W1943327251","https://openalex.org/W1968923826","https://openalex.org/W1977345694","https://openalex.org/W1996901532","https://openalex.org/W2021883973","https://openalex.org/W2062767843","https://openalex.org/W2108982334","https://openalex.org/W2111373249","https://openalex.org/W2117486996","https://openalex.org/W2120172561","https://openalex.org/W2127774996","https://openalex.org/W2138122982","https://openalex.org/W2141885858","https://openalex.org/W2145000359","https://openalex.org/W2149296309","https://openalex.org/W2156125289","https://openalex.org/W2159957100","https://openalex.org/W2164461702","https://openalex.org/W2168036974","https://openalex.org/W2186025959","https://openalex.org/W2739999456","https://openalex.org/W4320301318","https://openalex.org/W6655972840"],"related_works":["https://openalex.org/W2079145549","https://openalex.org/W2012129103","https://openalex.org/W4389053053","https://openalex.org/W2903170547","https://openalex.org/W2339549279","https://openalex.org/W1985522665","https://openalex.org/W2145268834","https://openalex.org/W2156226201","https://openalex.org/W2041545801","https://openalex.org/W1801992990"],"abstract_inverted_index":{"BACKGROUND:":[0],"With":[1],"the":[2,9,42,73,101,175,209,226],"development":[3],"of":[4,11,24,44,50,75,92,122,130,135,189,229],"Next":[5],"Generation":[6],"Sequencing":[7],"technologies,":[8],"number":[10,74,85],"predicted":[12,98],"proteins":[13,51,76,99,137,181],"from":[14,32,77,100,157],"entire":[15,78,234],"(meta-)":[16,79,235],"genomes":[17,80,236],"has":[18],"risen":[19],"exponentially.":[20],"While":[21],"for":[22,41,86,238],"some":[23],"these":[25,136,202],"sequences":[26],"protein":[27,45,149],"functions":[28],"can":[29],"be":[30,139],"inferred":[31],"homology,":[33],"an":[34,69,218],"experimental":[35,88],"characterization":[36,49,89],"is":[37],"still":[38],"a":[39,82,170],"requirement":[40],"determination":[43],"function.":[46],"However,":[47],"functional":[48,230],"cannot":[52],"keep":[53],"pace":[54],"with":[55],"our":[56,214],"capabilities":[57],"to":[58,71,81,116,178,196],"generate":[59],"more":[60,62],"and":[61,198,232],"sequence":[63],"data.":[64],"RESULTS:":[65],"Here,":[66],"we":[67,159,167,206,222],"present":[68],"approach":[70],"reduce":[72],"reasonably":[83],"small":[84],"further":[87],"without":[90],"loss":[91],"important":[93],"information.":[94],"About":[95],"6.1":[96],"million":[97,134],"Global":[102],"Ocean":[103],"Sampling":[104],"Expedition":[105],"Metagenome":[106],"project":[107],"were":[108,223],"distributed":[109],"into":[110],"classes":[111],"based":[112,192],"either":[113],"on":[114,193],"homology":[115,177,195],"existing":[117,155],"hidden":[118],"markov":[119],"models":[120],"(HMMs)":[121],"known":[123,197],"families,":[124,150],"or":[125],"de":[126],"novo":[127],"by":[128],"assessment":[129],"pairwise":[131],"similarity.":[132],"5.1":[133],"could":[138,160,207],"classified":[140],"in":[141,182,219],"this":[142,183],"way,":[143],"yielding":[144],"18,437":[145],"families.":[146],"For":[147,164],"4,129":[148],"which":[151,173],"did":[152],"not":[153],"match":[154],"HMMs":[156],"databases,":[158],"create":[161],"novel":[162,210],"HMMs.":[163],"each":[165],"family,":[166],"then":[168,186],"selected":[169,187],"representative":[171],"protein,":[172],"showed":[174],"closest":[176],"all":[179],"other":[180],"family.":[184],"We":[185],"representatives":[188],"four":[190,203],"families":[191],"their":[194],"well-characterized":[199],"lipases.":[200],"From":[201],"synthesized":[204],"genes,":[205],"obtain":[208],"esterase/lipase":[211],"GOS54,":[212],"validating":[213],"approach.":[215],"CONCLUSIONS:":[216],"Using":[217],"silico":[220],"approach,":[221],"able":[224],"improve":[225],"success":[227],"rate":[228],"screening":[231],"make":[233],"amenable":[237],"biochemical":[239],"characterization.":[240]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
