{"id":"https://openalex.org/W2102118387","doi":"https://doi.org/10.1142/s0219720009004151","title":"AN ORFOME ASSEMBLY APPROACH TO METAGENOMICS SEQUENCES ANALYSIS","display_name":"AN ORFOME ASSEMBLY APPROACH TO METAGENOMICS SEQUENCES ANALYSIS","publication_year":2009,"publication_date":"2009-06-01","ids":{"openalex":"https://openalex.org/W2102118387","doi":"https://doi.org/10.1142/s0219720009004151","mag":"2102118387","pmid":"https://pubmed.ncbi.nlm.nih.gov/19507285"},"language":"en","primary_location":{"id":"doi:10.1142/s0219720009004151","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219720009004151","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082620694","display_name":"Yuzhen Ye","orcid":"https://orcid.org/0000-0003-3707-3185"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"education","lineage":["https://openalex.org/I4210119109","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"YUZHEN YE","raw_affiliation_strings":["School of Informatics, Indiana University, Bloomington, IN 47408, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Informatics, Indiana University, Bloomington, IN 47408, USA","institution_ids":["https://openalex.org/I4210119109"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078007096","display_name":"Haixu Tang","orcid":"https://orcid.org/0000-0001-8963-8155"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"education","lineage":["https://openalex.org/I4210119109","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"HAIXU TANG","raw_affiliation_strings":["School of Informatics, Indiana University, Bloomington, IN 47408, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Informatics, Indiana University, Bloomington, IN 47408, USA","institution_ids":["https://openalex.org/I4210119109"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.1909,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.87511013,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"07","issue":"03","first_page":"455","last_page":"471"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11048","display_name":"Bacteriophages and microbial interactions","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metagenomics","display_name":"Metagenomics","score":0.9712036848068237},{"id":"https://openalex.org/keywords/orfs","display_name":"ORFS","score":0.7576082348823547},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.7342691421508789},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.6379423141479492},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.5487082004547119},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4987809658050537},{"id":"https://openalex.org/keywords/genomics","display_name":"Genomics","score":0.48066389560699463},{"id":"https://openalex.org/keywords/sequence-assembly","display_name":"Sequence assembly","score":0.4517133831977844},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.37403547763824463},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.32354438304901123},{"id":"https://openalex.org/keywords/open-reading-frame","display_name":"Open reading frame","score":0.24443960189819336},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.1312439739704132}],"concepts":[{"id":"https://openalex.org/C15151743","wikidata":"https://www.wikidata.org/wiki/Q903778","display_name":"Metagenomics","level":3,"score":0.9712036848068237},{"id":"https://openalex.org/C2780530800","wikidata":"https://www.wikidata.org/wiki/Q7072921","display_name":"ORFS","level":5,"score":0.7576082348823547},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.7342691421508789},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.6379423141479492},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.5487082004547119},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4987809658050537},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.48066389560699463},{"id":"https://openalex.org/C18949551","wikidata":"https://www.wikidata.org/wiki/Q740578","display_name":"Sequence assembly","level":5,"score":0.4517133831977844},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.37403547763824463},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.32354438304901123},{"id":"https://openalex.org/C47289529","wikidata":"https://www.wikidata.org/wiki/Q908550","display_name":"Open reading frame","level":4,"score":0.24443960189819336},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.1312439739704132},{"id":"https://openalex.org/C162317418","wikidata":"https://www.wikidata.org/wiki/Q252857","display_name":"Transcriptome","level":4,"score":0.0},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005827","descriptor_name":"Genetics, Microbial","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D005827","descriptor_name":"Genetics, Microbial","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D005827","descriptor_name":"Genetics, Microbial","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D005827","descriptor_name":"Genetics, Microbial","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011110","descriptor_name":"Polymorphism, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011110","descriptor_name":"Polymorphism, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011110","descriptor_name":"Polymorphism, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011110","descriptor_name":"Polymorphism, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012623","descriptor_name":"Seawater","qualifier_ui":"Q000821","qualifier_name":"virology","is_major_topic":false},{"descriptor_ui":"D012623","descriptor_name":"Seawater","qualifier_ui":"Q000821","qualifier_name":"virology","is_major_topic":false},{"descriptor_ui":"D012623","descriptor_name":"Seawater","qualifier_ui":"Q000821","qualifier_name":"virology","is_major_topic":false},{"descriptor_ui":"D012623","descriptor_name":"Seawater","qualifier_ui":"Q000821","qualifier_name":"virology","is_major_topic":false},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D016366","descriptor_name":"Open Reading Frames","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016366","descriptor_name":"Open Reading Frames","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016366","descriptor_name":"Open Reading Frames","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016366","descriptor_name":"Open Reading Frames","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":7,"locations":[{"id":"doi:10.1142/s0219720009004151","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219720009004151","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},{"id":"pmid:19507285","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/19507285","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of bioinformatics and computational biology","raw_type":null},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.209.610","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.209.610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://csb2008.org/csb2008papers/022Ye.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.212.7386","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.212.7386","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.worldscibooks.com/etextbook/p585/p585_chap01.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.330.3814","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.330.3814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.icpress.co.uk/etextbook/p585/p585_chap01.pdf","raw_type":"text"},{"id":"pmh:oai:pubmedcentral.nih.gov:2829862","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Bioinform Comput Biol","raw_type":"Text"},{"id":"pmh:oai:pubmedcentral.nih.gov:2829862","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2829862","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Bioinform Comput Biol","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:2829862","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Bioinform Comput Biol","raw_type":"Text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309409","display_name":"Lilly Endowment","ror":"https://ror.org/00cpsd622"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1560556066","https://openalex.org/W1571319209","https://openalex.org/W1635391495","https://openalex.org/W1791999417","https://openalex.org/W1838357706","https://openalex.org/W1970939265","https://openalex.org/W1973862547","https://openalex.org/W1974239617","https://openalex.org/W1992950355","https://openalex.org/W1995614275","https://openalex.org/W2011084061","https://openalex.org/W2042893247","https://openalex.org/W2062681025","https://openalex.org/W2072812562","https://openalex.org/W2079706758","https://openalex.org/W2090385974","https://openalex.org/W2098290178","https://openalex.org/W2098425296","https://openalex.org/W2099809434","https://openalex.org/W2103919457","https://openalex.org/W2109656602","https://openalex.org/W2112814753","https://openalex.org/W2113601822","https://openalex.org/W2115026474","https://openalex.org/W2116895571","https://openalex.org/W2124637227","https://openalex.org/W2127230663","https://openalex.org/W2129873761","https://openalex.org/W2130595050","https://openalex.org/W2132415967","https://openalex.org/W2136651963","https://openalex.org/W2137427011","https://openalex.org/W2142113273","https://openalex.org/W2144662851","https://openalex.org/W2145336165","https://openalex.org/W2153504428","https://openalex.org/W2155845142","https://openalex.org/W2159406441","https://openalex.org/W2165460636","https://openalex.org/W2167062509","https://openalex.org/W2167673155","https://openalex.org/W4239871258"],"related_works":["https://openalex.org/W2100847587","https://openalex.org/W2039410154","https://openalex.org/W2051856433","https://openalex.org/W2140948740","https://openalex.org/W2055448750","https://openalex.org/W3134563641","https://openalex.org/W3157741229","https://openalex.org/W1834562783","https://openalex.org/W1986608492","https://openalex.org/W3098103638"],"abstract_inverted_index":{"Metagenomics":[0],"is":[1,202,229],"an":[2,152],"emerging":[3],"methodology":[4],"for":[5,31,164,232],"the":[6,26,44,48,53,91,141,157,197,206,211,220,224,236,244],"direct":[7],"genomic":[8],"analysis":[9,222],"of":[10,14,20,37,52,65,117,149,167,200,213,223,243],"a":[11,100,123,147],"mixed":[12],"community":[13],"uncultured":[15],"microorganisms.":[16],"The":[17,35,74,112,186],"current":[18],"analyses":[19],"metagenomics":[21,124,179],"data":[22,105],"largely":[23],"rely":[24],"on":[25],"computational":[27,114],"tools":[28],"originally":[29],"designed":[30],"microbial":[32],"genomics":[33],"projects.":[34],"challenge":[36],"assembling":[38],"metagenomic":[39,104,225,233],"sequences":[40],"arises":[41],"mainly":[42],"from":[43,122],"short":[45,184],"reads":[46,58,201],"and":[47,81,169,216],"high":[49],"species":[50],"complexity":[51],"community.":[54],"Alternatively,":[55],"individual":[56],"(short)":[57],"will":[59,126],"be":[60,128],"searched":[61],"directly":[62],"against":[63],"databases":[64],"known":[66],"genes":[67],"(or":[68],"proteins)":[69],"to":[70,103,177],"identify":[71],"homologous":[72,85],"sequences.":[73],"latter":[75],"approach":[76,102,176],"may":[77,88,217],"have":[78],"low":[79,182,245],"sensitivity":[80,212],"specificity":[82],"in":[83],"identifying":[84],"sequences,":[86],"which":[87],"further":[89],"bias":[90],"subsequent":[92,170],"diversity":[93,171,221],"analysis.":[94,172],"In":[95],"this":[96],"paper,":[97],"we":[98],"present":[99],"novel":[101],"analysis,":[106],"called":[107],"Metagenomic":[108],"ORFome":[109,207],"Assembly":[110],"(MetaORFA).":[111],"whole":[113],"framework":[115],"consists":[116],"three":[118],"steps.":[119],"Each":[120],"read":[121],"project":[125],"first":[127],"annotated":[129],"with":[130,181],"putative":[131],"open":[132],"reading":[133],"frames":[134],"(ORFs)":[135],"that":[136,189],"likely":[137],"encode":[138],"proteins.":[139],"Next,":[140],"predicted":[142],"ORFs":[143],"are":[144,162],"assembled":[145,158],"into":[146],"collection":[148],"peptides":[150,159,194],"using":[151],"EULER":[153],"assembly":[154,208,238],"method.":[155],"Finally,":[156],"(i.e.":[160],"ORFome)":[161],"used":[163],"database":[165],"searching":[166],"homologs":[168],"We":[173],"applied":[174],"MetaORFA":[175,190],"several":[178],"datasets":[180],"coverage":[183,199],"reads.":[185],"results":[187],"show":[188],"can":[191],"produce":[192],"long":[193],"even":[195],"when":[196,235],"sequence":[198,246],"extremely":[203],"low.":[204],"Hence,":[205],"significantly":[209],"increases":[210],"homology":[214],"searching,":[215],"potentially":[218],"improve":[219],"data.":[226],"This":[227],"improvement":[228],"especially":[230],"useful":[231],"projects":[234],"genome":[237],"does":[239],"not":[240],"work":[241],"because":[242],"coverage.":[247]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":8}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
