{"id":"https://openalex.org/W4313598914","doi":"https://doi.org/10.1371/journal.pcbi.1010820","title":"Over-optimism in unsupervised microbiome analysis: Insights from network learning and clustering","display_name":"Over-optimism in unsupervised microbiome analysis: Insights from network learning and clustering","publication_year":2023,"publication_date":"2023-01-06","ids":{"openalex":"https://openalex.org/W4313598914","doi":"https://doi.org/10.1371/journal.pcbi.1010820","pmid":"https://pubmed.ncbi.nlm.nih.gov/36608142"},"language":"en","primary_location":{"id":"doi:10.1371/journal.pcbi.1010820","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1010820","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1010820&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1010820&type=printable","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040820559","display_name":"Theresa Ullmann","orcid":"https://orcid.org/0000-0003-1215-8561"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]},{"id":"https://openalex.org/I4403386549","display_name":"Munich Center for Machine Learning","ror":"https://ror.org/02nfy3535","country_code":null,"type":"education","lineage":["https://openalex.org/I4403386549","https://openalex.org/I62916508","https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Theresa Ullmann","raw_affiliation_strings":["Institute for Medical Information Processing, Biometry, and Epidemiology, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","Munich Center for Machine Learning (MCML), M\u00fcnchen, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Medical Information Processing, Biometry, and Epidemiology, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Munich Center for Machine Learning (MCML), M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I4403386549"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082908973","display_name":"Stefanie Peschel","orcid":"https://orcid.org/0000-0002-7936-7627"},"institutions":[{"id":"https://openalex.org/I3018134672","display_name":"Helmholtz Zentrum M\u00fcnchen","ror":"https://ror.org/00cfam450","country_code":"DE","type":"facility","lineage":["https://openalex.org/I1305996414","https://openalex.org/I3018134672"]},{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Stefanie Peschel","raw_affiliation_strings":["Department of Statistics, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","Institute for Asthma and Allergy Prevention, Helmholtz Zentrum M\u00fcnchen, Neuherberg, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Statistics, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Institute for Asthma and Allergy Prevention, Helmholtz Zentrum M\u00fcnchen, Neuherberg, Germany","institution_ids":["https://openalex.org/I3018134672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085691045","display_name":"Philipp Finger","orcid":null},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Philipp Finger","raw_affiliation_strings":["Institute for Medical Information Processing, Biometry, and Epidemiology, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Medical Information Processing, Biometry, and Epidemiology, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020021560","display_name":"Christian L. M\u00fcller","orcid":"https://orcid.org/0000-0002-3821-7083"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]},{"id":"https://openalex.org/I3018134672","display_name":"Helmholtz Zentrum M\u00fcnchen","ror":"https://ror.org/00cfam450","country_code":"DE","type":"facility","lineage":["https://openalex.org/I1305996414","https://openalex.org/I3018134672"]},{"id":"https://openalex.org/I4210153546","display_name":"Flatiron Health (United States)","ror":"https://ror.org/0508h6p74","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153546"]}],"countries":["DE","US"],"is_corresponding":true,"raw_author_name":"Christian L. M\u00fcller","raw_affiliation_strings":["Center for Computational Mathematics, Flatiron Institute, New York, New York, United States of America","Department of Statistics, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","Institute of Computational Biology, Helmholtz Zentrum M\u00fcnchen, Neuherberg, Germany"],"affiliations":[{"raw_affiliation_string":"Center for Computational Mathematics, Flatiron Institute, New York, New York, United States of America","institution_ids":["https://openalex.org/I4210153546"]},{"raw_affiliation_string":"Department of Statistics, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Institute of Computational Biology, Helmholtz Zentrum M\u00fcnchen, Neuherberg, Germany","institution_ids":["https://openalex.org/I3018134672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015152016","display_name":"Anne\u2010Laure Boulesteix","orcid":"https://orcid.org/0000-0002-2729-0947"},"institutions":[{"id":"https://openalex.org/I4403386549","display_name":"Munich Center for Machine Learning","ror":"https://ror.org/02nfy3535","country_code":null,"type":"education","lineage":["https://openalex.org/I4403386549","https://openalex.org/I62916508","https://openalex.org/I8204097"]},{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Anne-Laure Boulesteix","raw_affiliation_strings":["Institute for Medical Information Processing, Biometry, and Epidemiology, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","Munich Center for Machine Learning (MCML), M\u00fcnchen, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Medical Information Processing, Biometry, and Epidemiology, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I8204097"]},{"raw_affiliation_string":"Munich Center for Machine Learning (MCML), M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I4403386549"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5015152016","https://openalex.org/A5020021560","https://openalex.org/A5040820559","https://openalex.org/A5082908973","https://openalex.org/A5085691045"],"corresponding_institution_ids":["https://openalex.org/I3018134672","https://openalex.org/I4210153546","https://openalex.org/I4403386549","https://openalex.org/I8204097"],"apc_list":{"value":2655,"currency":"USD","value_usd":2655},"apc_paid":{"value":3203,"currency":"EUR","value_usd":3454},"fwci":1.5788,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.8230368,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"19","issue":"1","first_page":"e1010820","last_page":"e1010820"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10066","display_name":"Gut microbiota and health","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10066","display_name":"Gut microbiota and health","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/microbiome","display_name":"Microbiome","score":0.6658709049224854},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6133129596710205},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.6069637537002563},{"id":"https://openalex.org/keywords/optimism","display_name":"Optimism","score":0.5248896479606628},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.46169981360435486},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.42824786901474},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3791583776473999},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3453372120857239},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.34455564618110657},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.3253334164619446},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.28214752674102783}],"concepts":[{"id":"https://openalex.org/C143121216","wikidata":"https://www.wikidata.org/wiki/Q1330402","display_name":"Microbiome","level":2,"score":0.6658709049224854},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6133129596710205},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.6069637537002563},{"id":"https://openalex.org/C204017024","wikidata":"https://www.wikidata.org/wiki/Q485446","display_name":"Optimism","level":2,"score":0.5248896479606628},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.46169981360435486},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.42824786901474},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3791583776473999},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3453372120857239},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.34455564618110657},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3253334164619446},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.28214752674102783},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001419","descriptor_name":"Bacteria","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001419","descriptor_name":"Bacteria","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001419","descriptor_name":"Bacteria","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016000","descriptor_name":"Cluster Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D059013","descriptor_name":"Microbial Consortia","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D059013","descriptor_name":"Microbial Consortia","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D059013","descriptor_name":"Microbial Consortia","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D064307","descriptor_name":"Microbiota","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D064307","descriptor_name":"Microbiota","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D064307","descriptor_name":"Microbiota","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":7,"locations":[{"id":"doi:10.1371/journal.pcbi.1010820","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1010820","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1010820&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},{"id":"pmid:36608142","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36608142","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS computational biology","raw_type":null},{"id":"pmh:oai:epub.ub.uni-muenchen.de:94621","is_oa":true,"landing_page_url":"http://nbn-resolving.de/urn:nbn:de:bvb:19-epub-94621-2","pdf_url":"https://epub.ub.uni-muenchen.de/94621/","source":{"id":"https://openalex.org/S4306401845","display_name":"Open access LMU (Ludwid Maxmilian's Universitat Munchen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I8204097","host_organization_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","host_organization_lineage":["https://openalex.org/I8204097"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology","raw_type":"doc-type:article"},{"id":"pmh:oai:pubmedcentral.nih.gov:9873197","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9873197","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC9873197/pdf/pcbi.1010820.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Comput Biol","raw_type":"Text"},{"id":"pmh:oai:RePEc:plo:pcbi00:1010820","is_oa":false,"landing_page_url":"https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1010820","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},{"id":"pmh:oai:doaj.org/article:71e68bf1a3304669b4dab07b57c290ef","is_oa":true,"landing_page_url":"https://doaj.org/article/71e68bf1a3304669b4dab07b57c290ef","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, Vol 19, Iss 1, p e1010820 (2023)","raw_type":"article"},{"id":"pmh:oai:push-zb.helmholtz-munich.de:67183","is_oa":false,"landing_page_url":"https://push-zb.helmholtz-munich.de/frontdoor.php?source_opus=67183","pdf_url":null,"source":{"id":"https://openalex.org/S7407055352","display_name":"PuSH - Publication Server of Helmholtz Zentrum M\u00fcnchen","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Comput. Biol. 19:e1010820 (2023)","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1371/journal.pcbi.1010820","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1010820","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1010820&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1627710804","display_name":null,"funder_award_id":"BO3139/7-1","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G2734144814","display_name":null,"funder_award_id":"Munich","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G3467264548","display_name":null,"funder_award_id":"01IS18036A","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4313598914.pdf","grobid_xml":"https://content.openalex.org/works/W4313598914.grobid-xml"},"referenced_works_count":80,"referenced_works":["https://openalex.org/W178619957","https://openalex.org/W229097380","https://openalex.org/W1493454437","https://openalex.org/W1897139626","https://openalex.org/W1968105193","https://openalex.org/W1987184081","https://openalex.org/W1987971958","https://openalex.org/W2005852722","https://openalex.org/W2010824638","https://openalex.org/W2028221693","https://openalex.org/W2032230795","https://openalex.org/W2044712133","https://openalex.org/W2047020168","https://openalex.org/W2047940964","https://openalex.org/W2052969143","https://openalex.org/W2053801811","https://openalex.org/W2056944867","https://openalex.org/W2083717261","https://openalex.org/W2111358533","https://openalex.org/W2112408821","https://openalex.org/W2118629634","https://openalex.org/W2123402141","https://openalex.org/W2131681506","https://openalex.org/W2135303340","https://openalex.org/W2144981148","https://openalex.org/W2147618390","https://openalex.org/W2152239989","https://openalex.org/W2161498332","https://openalex.org/W2164005910","https://openalex.org/W2165874743","https://openalex.org/W2242390630","https://openalex.org/W2281227836","https://openalex.org/W2322006099","https://openalex.org/W2342543340","https://openalex.org/W2503647350","https://openalex.org/W2547512372","https://openalex.org/W2562137041","https://openalex.org/W2611957242","https://openalex.org/W2752667320","https://openalex.org/W2754041971","https://openalex.org/W2762425175","https://openalex.org/W2775152143","https://openalex.org/W2779812635","https://openalex.org/W2785509713","https://openalex.org/W2794407684","https://openalex.org/W2802287725","https://openalex.org/W2804854320","https://openalex.org/W2805044645","https://openalex.org/W2885319825","https://openalex.org/W2904250115","https://openalex.org/W2908338457","https://openalex.org/W2913835110","https://openalex.org/W2914251418","https://openalex.org/W2940897462","https://openalex.org/W2945015580","https://openalex.org/W2970428830","https://openalex.org/W3009013481","https://openalex.org/W3013926312","https://openalex.org/W3016700505","https://openalex.org/W3088303111","https://openalex.org/W3099768174","https://openalex.org/W3106625866","https://openalex.org/W3110476256","https://openalex.org/W3115999643","https://openalex.org/W3131993763","https://openalex.org/W3134735565","https://openalex.org/W3143324940","https://openalex.org/W3153302987","https://openalex.org/W3164872214","https://openalex.org/W3179596469","https://openalex.org/W3201611947","https://openalex.org/W4205364647","https://openalex.org/W4206080966","https://openalex.org/W4206912861","https://openalex.org/W4213163295","https://openalex.org/W4214929190","https://openalex.org/W4230931443","https://openalex.org/W4235169531","https://openalex.org/W6684578312","https://openalex.org/W6806128557"],"related_works":["https://openalex.org/W2122713011","https://openalex.org/W2071729956","https://openalex.org/W2900331548","https://openalex.org/W2965399423","https://openalex.org/W2116758642","https://openalex.org/W4247284515","https://openalex.org/W3141834514","https://openalex.org/W2904519018","https://openalex.org/W2607406914","https://openalex.org/W2969921651"],"abstract_inverted_index":{"In":[0,122,287],"recent":[1],"years,":[2],"unsupervised":[3,119,147],"analysis":[4,12,34,331],"of":[5,33,118,139,151,165,325,341,347],"microbiome":[6,120,142,330],"data,":[7,241,310],"such":[8],"as":[9,179],"microbial":[10,157,160],"network":[11,161,232],"and":[13,22,49,89,163,215,242,284,327,336,350],"clustering,":[14],"has":[15],"increased":[16],"in":[17,115,132,156,329],"popularity.":[18],"Many":[19],"new":[20],"statistical":[21,348],"computational":[23],"methods":[24,56,228],"have":[25,110,176],"been":[26,111],"proposed":[27],"for":[28,39,62,229,352],"these":[29,108,168,187],"tasks.":[30],"This":[31],"multiplicity":[32],"strategies":[35],"poses":[36],"a":[37,140],"challenge":[38],"researchers,":[40],"who":[41,144],"are":[42,72,170,236,279,293,304],"often":[43],"unsure":[44],"which":[45],"method(s)":[46],"to":[47,53,60,85,128,180,199,251,273,307,332],"use":[48],"might":[50,92,174,197,261],"be":[51,93],"tempted":[52],"try":[54],"different":[55],"on":[57,95,238,299],"their":[58],"dataset":[59,207],"look":[61],"the":[63,69,79,86,90,116,137,172,194,209,239,243,247,252,258,269,274,297,300,308,323,339,345],"\"best\"":[64,80,270],"ones.":[65],"However,":[66],"if":[67],"only":[68,262],"best":[70,248],"results":[71,91,278,298,335],"selectively":[73],"reported,":[74],"this":[75,133,264],"may":[76],"cause":[77],"over-optimism:":[78],"method":[81,225,271],"is":[82,255],"overly":[83],"fitted":[84],"specific":[87],"dataset,":[88],"non-replicable":[94],"validation":[96,216,275,285,301,326],"data.":[97,286,318],"Such":[98],"effects":[99,131],"will":[100],"ultimately":[101],"hinder":[102],"research":[103,148,222,290],"progress.":[104],"Yet":[105],"so":[106],"far,":[107],"topics":[109],"given":[112],"little":[113],"attention":[114],"context":[117,346],"analysis.":[121],"our":[123],"illustrative":[124],"study,":[125],"we":[126,266],"aim":[127],"quantify":[129],"over-optimism":[130,295,342],"context.":[134],"We":[135,185,201],"model":[136],"approach":[138],"hypothetical":[141,195,259],"researcher":[143,173,196,260],"undertakes":[145],"four":[146,289],"tasks:":[149],"clustering":[150,164],"bacterial":[152],"genera,":[153],"hub":[154],"detection":[155],"networks,":[158],"differential":[159],"analysis,":[162],"samples.":[166],"While":[167,257],"tasks":[169],"unsupervised,":[171],"still":[175],"certain":[177],"expectations":[178,188],"what":[181],"constitutes":[182],"interesting":[183],"results.":[184],"translate":[186],"into":[189,213,316],"concrete":[190],"evaluation":[191,253],"criteria":[192],"that":[193,245,338],"want":[198],"optimize.":[200],"then":[202,280],"randomly":[203],"split":[204],"an":[205],"exemplary":[206],"from":[208],"American":[210],"Gut":[211],"Project":[212],"discovery":[214,240,283,309],"sets":[217],"multiple":[218,224,313],"times.":[219],"For":[220],"each":[221],"task,":[223],"combinations":[226],"(e.g.,":[227],"data":[230,302],"normalization,":[231],"generation,":[233],"and/or":[234],"clustering)":[235],"tried":[237],"combination":[244,272],"yields":[246],"result":[249],"according":[250],"criterion":[254],"chosen.":[256],"report":[263],"result,":[265],"also":[267],"apply":[268],"dataset.":[276],"The":[277],"compared":[281,306],"between":[282],"all":[288],"tasks,":[291],"there":[292],"notable":[294],"effects;":[296],"set":[303],"worse":[305],"averaged":[311],"over":[312],"random":[314],"splits":[315],"discovery/validation":[317],"Our":[319],"study":[320],"thus":[321],"highlights":[322],"importance":[324],"replication":[328],"obtain":[333],"reliable":[334],"demonstrates":[337],"issue":[340],"goes":[343],"beyond":[344],"testing":[349],"fishing":[351],"significance.":[353]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
