{"id":"https://openalex.org/W7135173540","doi":"https://doi.org/10.1016/j.compbiomed.2026.111600","title":"A systematic review and benchmarking of modern metagenomic tools for taxonomic classification","display_name":"A systematic review and benchmarking of modern metagenomic tools for taxonomic classification","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W7135173540","doi":"https://doi.org/10.1016/j.compbiomed.2026.111600","pmid":"https://pubmed.ncbi.nlm.nih.gov/41830810"},"language":"en","primary_location":{"id":"doi:10.1016/j.compbiomed.2026.111600","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.compbiomed.2026.111600","pdf_url":null,"source":{"id":"https://openalex.org/S44278595","display_name":"Computers in Biology and Medicine","issn_l":"0010-4825","issn":["0010-4825","1879-0534"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers in Biology and Medicine","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.compbiomed.2026.111600","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113422674","display_name":"In\u00eas Branco Martins","orcid":null},"institutions":[{"id":"https://openalex.org/I60858718","display_name":"University of Aveiro","ror":"https://ror.org/00nt41z93","country_code":"PT","type":"education","lineage":["https://openalex.org/I60858718"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"In\u00eas Branco Martins","raw_affiliation_strings":["IEETA/DETI, LASI, University of Aveiro, Campus Universit\u00e1rio de Santiago, Aveiro, 3810-193, Portugal"],"affiliations":[{"raw_affiliation_string":"IEETA/DETI, LASI, University of Aveiro, Campus Universit\u00e1rio de Santiago, Aveiro, 3810-193, Portugal","institution_ids":["https://openalex.org/I60858718"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126254188","display_name":"Jorge Miguel Silva","orcid":null},"institutions":[{"id":"https://openalex.org/I60858718","display_name":"University of Aveiro","ror":"https://ror.org/00nt41z93","country_code":"PT","type":"education","lineage":["https://openalex.org/I60858718"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Jorge Miguel Silva","raw_affiliation_strings":["IEETA/DETI, LASI, University of Aveiro, Campus Universit\u00e1rio de Santiago, Aveiro, 3810-193, Portugal"],"affiliations":[{"raw_affiliation_string":"IEETA/DETI, LASI, University of Aveiro, Campus Universit\u00e1rio de Santiago, Aveiro, 3810-193, Portugal","institution_ids":["https://openalex.org/I60858718"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126785391","display_name":"Jo\u00e3o Rafael Almeida","orcid":null},"institutions":[{"id":"https://openalex.org/I60858718","display_name":"University of Aveiro","ror":"https://ror.org/00nt41z93","country_code":"PT","type":"education","lineage":["https://openalex.org/I60858718"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Jo\u00e3o Rafael Almeida","raw_affiliation_strings":["IEETA/DETI, LASI, University of Aveiro, Campus Universit\u00e1rio de Santiago, Aveiro, 3810-193, Portugal. Electronic address: joao.rafael.almeida@ua.pt"],"affiliations":[{"raw_affiliation_string":"IEETA/DETI, LASI, University of Aveiro, Campus Universit\u00e1rio de Santiago, Aveiro, 3810-193, Portugal. Electronic address: joao.rafael.almeida@ua.pt","institution_ids":["https://openalex.org/I60858718"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5126785391"],"corresponding_institution_ids":["https://openalex.org/I60858718"],"apc_list":{"value":2610,"currency":"USD","value_usd":2610},"apc_paid":{"value":2610,"currency":"USD","value_usd":2610},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.83161662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"206","issue":null,"first_page":"111600","last_page":"111600"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.508400022983551,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.508400022983551,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11048","display_name":"Bacteriophages and microbial interactions","score":0.4034999907016754,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12576","display_name":"vaccines and immunoinformatics approaches","score":0.012600000016391277,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metagenomics","display_name":"Metagenomics","score":0.8950999975204468},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.8582000136375427},{"id":"https://openalex.org/keywords/refseq","display_name":"RefSeq","score":0.6543999910354614},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5329999923706055},{"id":"https://openalex.org/keywords/biological-classification","display_name":"Biological classification","score":0.5019999742507935},{"id":"https://openalex.org/keywords/taxonomic-rank","display_name":"Taxonomic rank","score":0.41679999232292175}],"concepts":[{"id":"https://openalex.org/C15151743","wikidata":"https://www.wikidata.org/wiki/Q903778","display_name":"Metagenomics","level":3,"score":0.8950999975204468},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.8582000136375427},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6687999963760376},{"id":"https://openalex.org/C151810110","wikidata":"https://www.wikidata.org/wiki/Q7307074","display_name":"RefSeq","level":4,"score":0.6543999910354614},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5329999923706055},{"id":"https://openalex.org/C48702757","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Biological classification","level":2,"score":0.5019999742507935},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47040000557899475},{"id":"https://openalex.org/C189592816","wikidata":"https://www.wikidata.org/wiki/Q427626","display_name":"Taxonomic rank","level":3,"score":0.41679999232292175},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4025999903678894},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.39800000190734863},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37459999322891235},{"id":"https://openalex.org/C189708586","wikidata":"https://www.wikidata.org/wiki/Q1504425","display_name":"Systematic review","level":3,"score":0.3156999945640564},{"id":"https://openalex.org/C2984074130","wikidata":"https://www.wikidata.org/wiki/Q73539779","display_name":"R package","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.2662000060081482},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.257999986410141}],"mesh":[{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019985","descriptor_name":"Benchmarking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D056186","descriptor_name":"Metagenomics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1016/j.compbiomed.2026.111600","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.compbiomed.2026.111600","pdf_url":null,"source":{"id":"https://openalex.org/S44278595","display_name":"Computers in Biology and Medicine","issn_l":"0010-4825","issn":["0010-4825","1879-0534"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers in Biology and Medicine","raw_type":"journal-article"},{"id":"pmid:41830810","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41830810","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers in biology and medicine","raw_type":null}],"best_oa_location":{"id":"doi:10.1016/j.compbiomed.2026.111600","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.compbiomed.2026.111600","pdf_url":null,"source":{"id":"https://openalex.org/S44278595","display_name":"Computers in Biology and Medicine","issn_l":"0010-4825","issn":["0010-4825","1879-0534"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers in Biology and Medicine","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2045204781","https://openalex.org/W2055043387","https://openalex.org/W2107903949","https://openalex.org/W2595593998","https://openalex.org/W2773939681","https://openalex.org/W2918965813","https://openalex.org/W2968450569","https://openalex.org/W3217463608","https://openalex.org/W4225258284","https://openalex.org/W4291017687","https://openalex.org/W4298087616","https://openalex.org/W4324129364","https://openalex.org/W4379743275","https://openalex.org/W4392662892","https://openalex.org/W4401570038"],"related_works":[],"abstract_inverted_index":{"Advancements":[0],"in":[1,39,108],"metagenomics":[2],"have":[3],"been":[4],"driven":[5],"by":[6,155],"the":[7,21,64,76,92,165],"continuous":[8],"development":[9],"of":[10,24,56,101,197],"bioinformatic":[11],"tools,":[12,67,166,193],"particularly":[13],"taxonomic":[14,60],"classification":[15,61],"software,":[16],"which":[17],"are":[18,104],"central":[19],"to":[20,37],"accurate":[22],"characterization":[23],"microbial":[25],"communities.":[26],"However,":[27],"establishing":[28],"direct":[29],"comparisons":[30],"between":[31],"these":[32,102],"tools":[33,103,172,177],"remains":[34],"challenging":[35],"due":[36],"variations":[38],"evaluation":[40],"metrics,":[41],"reference":[42],"databases,":[43],"and":[44,72,83,115,125,169,183,200],"input":[45],"data":[46],"types.":[47],"In":[48],"this":[49],"study,":[50],"we":[51],"present":[52],"a":[53,87],"systematic":[54],"review":[55,187],"recently":[57],"developed":[58],"metagenomic":[59],"tools.":[62],"Of":[63],"31":[65],"identified":[66],"nine":[68],"satisfied":[69],"all":[70],"functional":[71],"methodological":[73],"criteria":[74],"for":[75,120,130,191],"benchmark":[77],"analysis.":[78],"We":[79],"evaluated":[80],"their":[81,198],"accuracy":[82,119,129],"computational":[84,201],"performance":[85,189],"using":[86],"standardized":[88],"dataset":[89],"derived":[90],"from":[91],"NCBI":[93],"RefSeq":[94],"database.":[95],"Our":[96],"analysis":[97],"revealed":[98],"that":[99],"most":[100,139],"domain-specific,":[105],"each":[106],"excelling":[107],"particular":[109],"areas.":[110],"Tools":[111],"like":[112,178],"TAMA,":[113],"CAMITAX":[114],"PhyloFlash":[116],"achieved":[117,127,134],"higher":[118,128],"prokaryotic":[121],"organisms,":[122],"while":[123,176],"ViWrap":[124],"PhaBOX":[126],"viral":[131],"classifications.":[132],"SqueezeMeta":[133],"high":[135],"F1":[136],"scores":[137],"across":[138],"domains,":[140],"though":[141],"its":[142],"assembly-based":[143],"architecture":[144],"limits":[145],"effectiveness":[146],"on":[147],"highly":[148],"diverse":[149],"samples.":[150],"MegaPath-Nano":[151],"was":[152],"least":[153],"affected":[154],"increased":[156],"mutation":[157],"rates.":[158],"The":[159],"execution":[160],"time":[161],"varied":[162],"widely":[163],"among":[164],"with":[167],"domain-specific":[168],"machine":[170],"learning-based":[171],"generally":[173],"being":[174],"faster,":[175],"BASTA":[179],"had":[180],"longer":[181],"runtimes":[182],"lower":[184],"accuracy.":[185],"This":[186],"synthesizes":[188],"results":[190],"current":[192],"providing":[194],"an":[195],"overview":[196],"strengths":[199],"methodologies.":[202]},"counts_by_year":[],"updated_date":"2026-03-24T08:02:53.985720","created_date":"2026-03-14T00:00:00"}
