{"id":"https://openalex.org/W2557731459","doi":"https://doi.org/10.1145/2975167.2975174","title":"Reference-free comparison of microbial communities via de Bruijn graphs","display_name":"Reference-free comparison of microbial communities via de Bruijn graphs","publication_year":2016,"publication_date":"2016-10-02","ids":{"openalex":"https://openalex.org/W2557731459","doi":"https://doi.org/10.1145/2975167.2975174","mag":"2557731459"},"language":"en","primary_location":{"id":"doi:10.1145/2975167.2975174","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2975167.2975174","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Bioinformatics, Computational Biology, and Health Informatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017101305","display_name":"Serghei Mangul","orcid":"https://orcid.org/0000-0003-4770-3443"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Serghei Mangul","raw_affiliation_strings":["Computer Science Department, University of California, Los Angeles, CA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, University of California, Los Angeles, CA","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002668669","display_name":"David Koslicki","orcid":"https://orcid.org/0000-0002-0640-954X"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Koslicki","raw_affiliation_strings":["Mathematics Department, Oregon State University, Corvallis, OR"],"affiliations":[{"raw_affiliation_string":"Mathematics Department, Oregon State University, Corvallis, OR","institution_ids":["https://openalex.org/I131249849"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5017101305"],"corresponding_institution_ids":["https://openalex.org/I161318765"],"apc_list":null,"apc_paid":null,"fwci":0.3335,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.68512206,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"68","last_page":"77"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10066","display_name":"Gut microbiota and health","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10066","display_name":"Gut microbiota and health","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11791","display_name":"Microbial Community Ecology and Physiology","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/de-bruijn-sequence","display_name":"De Bruijn sequence","score":0.6960174441337585},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.576856255531311},{"id":"https://openalex.org/keywords/de-bruijn-graph","display_name":"De Bruijn graph","score":0.547032356262207},{"id":"https://openalex.org/keywords/microbial-population-biology","display_name":"Microbial population biology","score":0.5118764638900757},{"id":"https://openalex.org/keywords/taxonomic-rank","display_name":"Taxonomic rank","score":0.42271688580513},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38829904794692993},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.38638895750045776},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.37574562430381775},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.31964361667633057},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.31828853487968445},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18109002709388733},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.1185978353023529},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.09884804487228394},{"id":"https://openalex.org/keywords/taxon","display_name":"Taxon","score":0.07805922627449036}],"concepts":[{"id":"https://openalex.org/C170320093","wikidata":"https://www.wikidata.org/wiki/Q1953457","display_name":"De Bruijn sequence","level":2,"score":0.6960174441337585},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.576856255531311},{"id":"https://openalex.org/C20218877","wikidata":"https://www.wikidata.org/wiki/Q3066095","display_name":"De Bruijn graph","level":3,"score":0.547032356262207},{"id":"https://openalex.org/C81407943","wikidata":"https://www.wikidata.org/wiki/Q17149178","display_name":"Microbial population biology","level":3,"score":0.5118764638900757},{"id":"https://openalex.org/C189592816","wikidata":"https://www.wikidata.org/wiki/Q427626","display_name":"Taxonomic rank","level":3,"score":0.42271688580513},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38829904794692993},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.38638895750045776},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37574562430381775},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.31964361667633057},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.31828853487968445},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18109002709388733},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.1185978353023529},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.09884804487228394},{"id":"https://openalex.org/C71640776","wikidata":"https://www.wikidata.org/wiki/Q16521","display_name":"Taxon","level":2,"score":0.07805922627449036},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C523546767","wikidata":"https://www.wikidata.org/wiki/Q10876","display_name":"Bacteria","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2975167.2975174","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2975167.2975174","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Bioinformatics, Computational Biology, and Health Informatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7200000286102295,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1559169059","https://openalex.org/W2000589358","https://openalex.org/W2009170813","https://openalex.org/W2010002522","https://openalex.org/W2010361633","https://openalex.org/W2016853666","https://openalex.org/W2023574331","https://openalex.org/W2023924471","https://openalex.org/W2034820020","https://openalex.org/W2045449780","https://openalex.org/W2055043387","https://openalex.org/W2078689689","https://openalex.org/W2091232725","https://openalex.org/W2096981901","https://openalex.org/W2097493826","https://openalex.org/W2117727476","https://openalex.org/W2118629634","https://openalex.org/W2128124531","https://openalex.org/W2131026689","https://openalex.org/W2136777606","https://openalex.org/W2140729960","https://openalex.org/W2145336165","https://openalex.org/W2152885278","https://openalex.org/W2158485828","https://openalex.org/W2160969485","https://openalex.org/W2166123725","https://openalex.org/W2170551349","https://openalex.org/W2539033431"],"related_works":["https://openalex.org/W2562683361","https://openalex.org/W3087469195","https://openalex.org/W2354744388","https://openalex.org/W3125399386","https://openalex.org/W2949121831","https://openalex.org/W3215786367","https://openalex.org/W1908987670","https://openalex.org/W2756186577","https://openalex.org/W2735897904","https://openalex.org/W3021341025"],"abstract_inverted_index":{"Microbial":[0],"communities":[1,57,133],"inhabiting":[2],"the":[3,51,75,81,109,131,136,171],"human":[4],"body":[5],"exhibit":[6],"significant":[7],"variability":[8],"across":[9,58,102],"different":[10,59],"individuals":[11],"and":[12,14,24,78,128,154,164,195],"tissues,":[13],"are":[15,184],"suggested":[16],"to":[17,31,53,69,84,96,125,143,160,179,186,191],"play":[18],"an":[19],"important":[20],"role":[21],"in":[22,99,208],"health":[23],"disease.":[25],"High-throughput":[26],"sequencing":[27,82,110],"offers":[28],"unprecedented":[29],"possibilities":[30],"profile":[32],"microbial":[33,47,56,86,100,132,173],"community":[34],"composition,":[35],"but":[36],"limitations":[37,72],"of":[38,45,130],"existing":[39,46],"taxonomic":[40],"classification":[41,76],"methods":[42],"(including":[43],"incompleteness":[44],"reference":[48],"databases)":[49],"limits":[50],"ability":[52],"accurately":[54],"compare":[55,85,176],"samples.":[60,103,197],"In":[61],"this":[62,141,201],"paper,":[63],"we":[64],"present":[65],"a":[66,92,113,148,188,205],"method":[67,90,142],"able":[68,159],"overcome":[70],"these":[71,177],"by":[73],"circumventing":[74],"step":[77],"directly":[79],"using":[80],"data":[83,111,145],"communities.":[87],"The":[88,117],"proposed":[89],"provides":[91],"powerful":[93],"reference-free":[94,202],"way":[95],"assess":[97],"differences":[98,129],"abundances":[101],"This":[104],"method,":[105],"called":[106],"EMDeBruijn,":[107],"condenses":[108],"into":[112],"de":[114],"Bruijn":[115],"graph.":[116],"Earth":[118],"Mover's":[119],"Distance":[120],"(EMD)":[121],"is":[122,158,204],"then":[123],"used":[124],"measure":[126],"similarities":[127],"associated":[134],"with":[135],"individual":[137],"graphs.":[138],"We":[139,175,198],"apply":[140],"RNA-Seq":[144],"sets":[146],"from":[147],"coronary":[149],"artery":[150],"calcification":[151],"(CAC)":[152],"study":[153],"shown":[155,185],"that":[156,200],"EMDeBruijn":[157],"differentiate":[161],"between":[162,193],"case":[163,194],"control":[165,196],"CAC":[166],"samples":[167],"while":[168],"utilizing":[169],"all":[170],"candidate":[172],"reads.":[174],"results":[178],"current":[180],"reference-based":[181],"methods,":[182],"which":[183],"have":[187],"limited":[189],"capacity":[190],"discriminate":[192],"conclude":[199],"approach":[203],"viable":[206],"choice":[207],"comparative":[209],"metatranscriptomic":[210],"studies.":[211]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
