{"id":"https://openalex.org/W2043602518","doi":"https://doi.org/10.1186/1471-2105-9-419","title":"A database of phylogenetically atypical genes in archaeal and bacterial genomes, identified using the DarkHorse algorithm","display_name":"A database of phylogenetically atypical genes in archaeal and bacterial genomes, identified using the DarkHorse algorithm","publication_year":2008,"publication_date":"2008-10-07","ids":{"openalex":"https://openalex.org/W2043602518","doi":"https://doi.org/10.1186/1471-2105-9-419","mag":"2043602518","pmid":"https://pubmed.ncbi.nlm.nih.gov/18840280"},"language":"en","primary_location":{"id":"doi:10.1186/1471-2105-9-419","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-9-419","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-419","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-419","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044467135","display_name":"Sheila Podell","orcid":"https://orcid.org/0000-0001-7073-5190"},"institutions":[{"id":"https://openalex.org/I150209017","display_name":"Scripps Institution of Oceanography","ror":"https://ror.org/04v7hvq31","country_code":"US","type":"facility","lineage":["https://openalex.org/I150209017","https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sheila Podell","raw_affiliation_strings":["Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA 92093 USA. spodell@ucsd.edu","Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA, 92093, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA 92093 USA. spodell@ucsd.edu","institution_ids":["https://openalex.org/I150209017"]},{"raw_affiliation_string":"Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA, 92093, USA","institution_ids":["https://openalex.org/I150209017"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080777434","display_name":"Terry Gaasterland","orcid":"https://orcid.org/0000-0003-4023-9342"},"institutions":[{"id":"https://openalex.org/I150209017","display_name":"Scripps Institution of Oceanography","ror":"https://ror.org/04v7hvq31","country_code":"US","type":"facility","lineage":["https://openalex.org/I150209017","https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Terry Gaasterland","raw_affiliation_strings":["Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA, 92093, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA, 92093, USA","institution_ids":["https://openalex.org/I150209017"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049116965","display_name":"Eric E. Allen","orcid":"https://orcid.org/0000-0002-1229-8794"},"institutions":[{"id":"https://openalex.org/I150209017","display_name":"Scripps Institution of Oceanography","ror":"https://ror.org/04v7hvq31","country_code":"US","type":"facility","lineage":["https://openalex.org/I150209017","https://openalex.org/I36258959"]},{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eric E Allen","raw_affiliation_strings":["Division of Biological Sciences, University of California at San Diego, La Jolla, CA, 92093, USA","Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA, 92093, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Biological Sciences, University of California at San Diego, La Jolla, CA, 92093, USA","institution_ids":["https://openalex.org/I36258959"]},{"raw_affiliation_string":"Marine Biology Research Division, Scripps Institution of Oceanography University of California at San Diego, La Jolla, CA, 92093, USA","institution_ids":["https://openalex.org/I150209017"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5044467135"],"corresponding_institution_ids":["https://openalex.org/I150209017"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":0.9815,"has_fulltext":true,"cited_by_count":45,"citation_normalized_percentile":{"value":0.74688114,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"9","issue":"1","first_page":"419","last_page":"419"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.7178999781608582,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.7178999781608582,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T13664","display_name":"Genome Rearrangement Algorithms","score":0.17669999599456787,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10120","display_name":"Bacterial Genetics and Biotechnology","score":0.03460000082850456,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.7630200386047363},{"id":"https://openalex.org/keywords/phylogenetic-tree","display_name":"Phylogenetic tree","score":0.7496170401573181},{"id":"https://openalex.org/keywords/horizontal-gene-transfer","display_name":"Horizontal gene transfer","score":0.6289986371994019},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.6258573532104492},{"id":"https://openalex.org/keywords/refseq","display_name":"RefSeq","score":0.6220231056213379},{"id":"https://openalex.org/keywords/bacterial-genome-size","display_name":"Bacterial genome size","score":0.6053395867347717},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.5301419496536255},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.4950698912143707},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.48911625146865845},{"id":"https://openalex.org/keywords/phylogenetics","display_name":"Phylogenetics","score":0.47484830021858215},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.45441755652427673},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4526859521865845},{"id":"https://openalex.org/keywords/dna-microarray","display_name":"DNA microarray","score":0.4498365521430969},{"id":"https://openalex.org/keywords/multiple-sequence-alignment","display_name":"Multiple sequence alignment","score":0.43098539113998413},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.16370338201522827}],"concepts":[{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.7630200386047363},{"id":"https://openalex.org/C193252679","wikidata":"https://www.wikidata.org/wiki/Q242125","display_name":"Phylogenetic tree","level":3,"score":0.7496170401573181},{"id":"https://openalex.org/C92938381","wikidata":"https://www.wikidata.org/wiki/Q83185","display_name":"Horizontal gene transfer","level":4,"score":0.6289986371994019},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.6258573532104492},{"id":"https://openalex.org/C151810110","wikidata":"https://www.wikidata.org/wiki/Q7307074","display_name":"RefSeq","level":4,"score":0.6220231056213379},{"id":"https://openalex.org/C3742359","wikidata":"https://www.wikidata.org/wiki/Q4839988","display_name":"Bacterial genome size","level":4,"score":0.6053395867347717},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.5301419496536255},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.4950698912143707},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.48911625146865845},{"id":"https://openalex.org/C90132467","wikidata":"https://www.wikidata.org/wiki/Q171184","display_name":"Phylogenetics","level":3,"score":0.47484830021858215},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.45441755652427673},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4526859521865845},{"id":"https://openalex.org/C95371953","wikidata":"https://www.wikidata.org/wiki/Q591745","display_name":"DNA microarray","level":4,"score":0.4498365521430969},{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.43098539113998413},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.16370338201522827},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001482","descriptor_name":"Base Composition","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D001482","descriptor_name":"Base Composition","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D001482","descriptor_name":"Base Composition","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D010802","descriptor_name":"Phylogeny","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D010802","descriptor_name":"Phylogeny","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D010802","descriptor_name":"Phylogeny","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D014584","descriptor_name":"User-Computer Interface","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D014584","descriptor_name":"User-Computer Interface","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D014584","descriptor_name":"User-Computer Interface","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016680","descriptor_name":"Genome, Bacterial","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016680","descriptor_name":"Genome, Bacterial","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016680","descriptor_name":"Genome, Bacterial","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017422","descriptor_name":"Sequence Analysis, DNA","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017422","descriptor_name":"Sequence Analysis, DNA","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017422","descriptor_name":"Sequence Analysis, DNA","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020745","descriptor_name":"Genome, Archaeal","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020745","descriptor_name":"Genome, Archaeal","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020745","descriptor_name":"Genome, Archaeal","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D022761","descriptor_name":"Gene Transfer, Horizontal","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D022761","descriptor_name":"Gene Transfer, Horizontal","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D022761","descriptor_name":"Gene Transfer, Horizontal","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":4,"locations":[{"id":"doi:10.1186/1471-2105-9-419","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-9-419","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-419","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:18840280","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/18840280","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:0c2857d46145473d93cc1dd010967ca0","is_oa":true,"landing_page_url":"https://doaj.org/article/0c2857d46145473d93cc1dd010967ca0","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 9, Iss 1, p 419 (2008)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:2573894","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2573894","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1471-2105-9-419","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-9-419","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-419","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306202","display_name":"Gordon and Betty Moore Foundation","ror":"https://ror.org/006wxqw41"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2043602518.pdf","grobid_xml":"https://content.openalex.org/works/W2043602518.grobid-xml"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W1964343317","https://openalex.org/W1993470051","https://openalex.org/W1995249986","https://openalex.org/W2017470100","https://openalex.org/W2024011853","https://openalex.org/W2028626290","https://openalex.org/W2039158827","https://openalex.org/W2069502786","https://openalex.org/W2124817677","https://openalex.org/W2126730752","https://openalex.org/W2139636599","https://openalex.org/W2140703422","https://openalex.org/W2146622826","https://openalex.org/W2147667803","https://openalex.org/W2150471837","https://openalex.org/W2163420689"],"related_works":["https://openalex.org/W2051969447","https://openalex.org/W3035691570","https://openalex.org/W2111937814","https://openalex.org/W25489809","https://openalex.org/W2162923930","https://openalex.org/W1788797176","https://openalex.org/W3212385379","https://openalex.org/W1482324242","https://openalex.org/W2133116680","https://openalex.org/W2091678889"],"abstract_inverted_index":{"BACKGROUND:":[0],"The":[1,122,187,246],"process":[2],"of":[3,31,48,156,256,294],"horizontal":[4,111,295],"gene":[5,112,296],"transfer":[6,113],"(HGT)":[7],"is":[8,21,232,299],"believed":[9],"to":[10,53,75,128,158,204,225,234,265],"be":[11,223,306,322],"widespread":[12],"in":[13,26,182,271,313],"Bacteria":[14],"and":[15,98,133,274,281],"Archaea,":[16],"but":[17],"little":[18],"comparative":[19],"data":[20,36],"available":[22,101,233],"addressing":[23],"its":[24,99],"occurrence":[25],"complete":[27],"microbial":[28,130],"genomes.":[29,219],"Collection":[30],"high-quality,":[32],"automated":[33],"HGT":[34,145,208,248,269,276],"prediction":[35],"based":[37],"on":[38,68],"phylogenetic":[39,90,238],"evidence":[40],"has":[41,125],"previously":[42],"been":[43,126],"impractical":[44],"for":[45,63,164,193,258],"large":[46],"numbers":[47],"genomes":[49,153,157],"at":[50],"once,":[51],"due":[52],"prohibitive":[54],"computational":[55],"demands.":[56],"DarkHorse,":[57],"a":[58,69,73,93,138,236,252,300],"recently":[59],"described":[60],"statistical":[61],"method":[62],"discovering":[64],"phylogenetically":[65,212,260],"atypical":[66,215,261],"genes":[67],"genome-wide":[70],"basis,":[71],"provides":[72,251],"means":[74],"solve":[76],"this":[77],"problem":[78],"through":[79],"lineage":[80],"probability":[81],"index":[82],"(LPI)":[83],"ranking":[84],"scores.":[85],"LPI":[86,107,161,191],"scores":[87,108,118,192],"inversely":[88],"reflect":[89],"distance":[91],"between":[92],"test":[94],"amino":[95,171],"acid":[96,172],"sequence":[97,173],"closest":[100],"database":[102,250],"matches.":[103],"Proteins":[104],"with":[105,116,178,308],"low":[106],"are":[109,119,211],"good":[110],"candidates;":[114],"those":[115],"high":[117],"not.":[120],"DESCRIPTION:":[121],"DarkHorse":[123,144,247,286],"algorithm":[124,287],"applied":[127],"955":[129],"genome":[131,282],"sequences,":[132,200],"the":[134,143,202,241,285],"results":[135],"organized":[136],"into":[137],"web-searchable":[139],"relational":[140],"database,":[141],"called":[142],"Candidate":[146,249],"Resource":[147],"http://darkhorse.ucsd.edu.":[148],"Users":[149],"can":[150,222,305],"select":[151,176],"individual":[152,268],"or":[154,170,175,214,228],"groups":[155],"screen":[159],"by":[160,167,289],"score,":[162],"search":[163,188],"protein":[165,279],"functions":[166],"descriptive":[168],"annotation":[169],"similarity,":[174],"proteins":[177],"unusual":[179],"G+C":[180],"composition":[181],"their":[183,217],"underlying":[184],"coding":[185],"sequences.":[186],"engine":[189],"reports":[190],"match":[194],"partners":[195],"as":[196,198],"well":[197],"query":[199],"providing":[201],"opportunity":[203],"explore":[205,266],"whether":[206,227],"potential":[207,242],"donor":[209,243],"sequences":[210],"typical":[213],"within":[216],"own":[218],"This":[220],"information":[221,231],"used":[224],"predict":[226],"not":[229,320],"sufficient":[230],"build":[235],"well-supported":[237],"tree":[239],"using":[240],"sequence.":[244],"CONCLUSION:":[245],"powerful,":[253],"flexible":[254],"set":[255],"tools":[257],"identifying":[259],"proteins,":[262],"allowing":[263],"researchers":[264],"both":[267],"events":[270],"single":[272],"genomes,":[273],"large-scale":[275],"patterns":[277],"among":[278],"families":[280],"groups.":[283],"Although":[284],"cannot,":[288],"itself,":[290],"provide":[291],"definitive":[292],"proof":[293],"transfer,":[297],"it":[298],"flexible,":[301],"powerful":[302],"tool":[303],"that":[304],"combined":[307],"slower,":[309],"more":[310],"rigorous":[311],"methods":[312,318],"situations":[314],"where":[315],"these":[316],"other":[317],"could":[319],"otherwise":[321],"applied.":[323]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":3}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
