{"id":"https://openalex.org/W2126880537","doi":"https://doi.org/10.1109/cibcb.2007.4221215","title":"Operon Prediction in Microbial Genomes Using Decision Tree Approach","display_name":"Operon Prediction in Microbial Genomes Using Decision Tree Approach","publication_year":2007,"publication_date":"2007-04-01","ids":{"openalex":"https://openalex.org/W2126880537","doi":"https://doi.org/10.1109/cibcb.2007.4221215","mag":"2126880537"},"language":"en","primary_location":{"id":"doi:10.1109/cibcb.2007.4221215","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cibcb.2007.4221215","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE Symposium on Computational Intelligence and Bioinformatics and Computational Biology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101612165","display_name":"Dongsheng Che","orcid":"https://orcid.org/0000-0002-3086-6513"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dongsheng Che","raw_affiliation_strings":["Department of Computer Science, University of Georgia, Athens, GA, USA","Dept. of Comput. Sci., Georgia Univ., Athens, GA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Georgia Univ., Athens, GA","institution_ids":["https://openalex.org/I165733156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076081661","display_name":"Jizhen Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jizhen Zhao","raw_affiliation_strings":["Department of Computer Science, University of Georgia, Athens, GA, USA","Dept. of Comput. Sci., Georgia Univ., Athens, GA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Georgia Univ., Athens, GA","institution_ids":["https://openalex.org/I165733156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012513857","display_name":"Liming Cai","orcid":"https://orcid.org/0000-0002-8982-2435"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Liming Cai","raw_affiliation_strings":["Department of Computer Science, University of Georgia, Athens, GA, USA","Dept. of Comput. Sci., Georgia Univ., Athens, GA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Georgia Univ., Athens, GA","institution_ids":["https://openalex.org/I165733156"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020171946","display_name":"Ying Xu","orcid":"https://orcid.org/0000-0002-7856-3343"},"institutions":[{"id":"https://openalex.org/I165733156","display_name":"University of Georgia","ror":"https://ror.org/00te3t702","country_code":"US","type":"education","lineage":["https://openalex.org/I165733156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ying Xu","raw_affiliation_strings":["Department of Biochemistry and Molecular Biology, and Institute of Bioinformatics, University of Georgia, Athens, GA, USA","Department of Biochemistry and Molecular Biology, and Institute of Bioinformatics, University of Georgia, Athens, GA 30602. Email: xyn@bmb.uga.edu"],"affiliations":[{"raw_affiliation_string":"Department of Biochemistry and Molecular Biology, and Institute of Bioinformatics, University of Georgia, Athens, GA, USA","institution_ids":["https://openalex.org/I165733156"]},{"raw_affiliation_string":"Department of Biochemistry and Molecular Biology, and Institute of Bioinformatics, University of Georgia, Athens, GA 30602. Email: xyn@bmb.uga.edu","institution_ids":["https://openalex.org/I165733156"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101612165"],"corresponding_institution_ids":["https://openalex.org/I165733156"],"apc_list":null,"apc_paid":null,"fwci":0.5236,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.65584557,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"135","last_page":"142"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/operon","display_name":"Operon","score":0.812640905380249},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.5300236344337463},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.5299153327941895},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.529435396194458},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47513654828071594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4660530984401703},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.46423378586769104},{"id":"https://openalex.org/keywords/phylogenetic-tree","display_name":"Phylogenetic tree","score":0.4355052709579468},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.41221123933792114},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3556719422340393},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.35109442472457886},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.3462936580181122},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.34258633852005005},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.29338255524635315},{"id":"https://openalex.org/keywords/escherichia-coli","display_name":"Escherichia coli","score":0.1900513768196106}],"concepts":[{"id":"https://openalex.org/C203075996","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operon","level":4,"score":0.812640905380249},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.5300236344337463},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.5299153327941895},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.529435396194458},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47513654828071594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4660530984401703},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.46423378586769104},{"id":"https://openalex.org/C193252679","wikidata":"https://www.wikidata.org/wiki/Q242125","display_name":"Phylogenetic tree","level":3,"score":0.4355052709579468},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.41221123933792114},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3556719422340393},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35109442472457886},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.3462936580181122},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.34258633852005005},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.29338255524635315},{"id":"https://openalex.org/C547475151","wikidata":"https://www.wikidata.org/wiki/Q25419","display_name":"Escherichia coli","level":3,"score":0.1900513768196106}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cibcb.2007.4221215","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cibcb.2007.4221215","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE Symposium on Computational Intelligence and Bioinformatics and Computational Biology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life in Land","score":0.699999988079071,"id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306352","display_name":"Georgia Cancer Coalition","ror":"https://ror.org/0009gvn90"},{"id":"https://openalex.org/F4320337393","display_name":"Division of Chemistry","ror":"https://ror.org/01ar8dr59"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1514308025","https://openalex.org/W1570448133","https://openalex.org/W1990453950","https://openalex.org/W2025853251","https://openalex.org/W2029112298","https://openalex.org/W2064384066","https://openalex.org/W2096731969","https://openalex.org/W2102199998","https://openalex.org/W2102498314","https://openalex.org/W2104724853","https://openalex.org/W2105792118","https://openalex.org/W2106913956","https://openalex.org/W2107337820","https://openalex.org/W2107424557","https://openalex.org/W2118552280","https://openalex.org/W2119571185","https://openalex.org/W2121899130","https://openalex.org/W2125055259","https://openalex.org/W2128923603","https://openalex.org/W2130150648","https://openalex.org/W2132867976","https://openalex.org/W2142967149","https://openalex.org/W2146270437","https://openalex.org/W2148973980","https://openalex.org/W2152824658","https://openalex.org/W6631011338","https://openalex.org/W6674388619"],"related_works":["https://openalex.org/W2771255398","https://openalex.org/W3200027047","https://openalex.org/W2966195860","https://openalex.org/W4224922629","https://openalex.org/W3125536479","https://openalex.org/W4385770464","https://openalex.org/W2930428186","https://openalex.org/W4214820172","https://openalex.org/W4386984454","https://openalex.org/W3120363735"],"abstract_inverted_index":{"Identifying":[0],"operons":[1,110],"at":[2,193],"the":[3,175,180],"whole":[4,40],"genome":[5,41],"scale":[6],"of":[7,13,22,43,46,68,89,105,108,113],"microbial":[8],"organisms":[9],"can":[10],"facilitate":[11],"deciphering":[12],"transcriptional":[14],"regulation,":[15],"biological":[16],"networks":[17],"and":[18,29,97,101,111,119,125,146,164],"pathways.":[19],"A":[20],"number":[21,45],"computational":[23],"methods,":[24],"such":[25,58],"as":[26,59],"naive":[27,160],"Bayesian":[28],"neural":[30,162],"network":[31,163],"approaches,":[32],"have":[33],"been":[34],"employed":[35],"for":[36,142,148,183],"operon":[37,83,184],"prediction":[38,138],"to":[39,53,81,133],"sequences":[42],"a":[44,77],"prokaryotic":[47],"organisms,":[48],"based":[49,129],"on":[50,130,168],"features":[51],"known":[52,109],"be":[54],"associated":[55],"with":[56],"operons,":[57],"intergenic":[60,92],"distance,":[61,93],"microarray":[62],"expression":[63],"data,":[64],"phylogenetic":[65],"profiles,":[66],"clusters":[67],"orthologous":[69],"groups":[70],"(COG).":[71],"In":[72],"this":[73],"paper,":[74],"we":[75],"introduce":[76],"decision":[78,127,176],"tree":[79,177],"approach":[80,178],"predict":[82,134],"structures":[84],"using":[85],"three":[86],"effective":[87],"types":[88],"genomic":[90],"data:":[91],"gene":[94],"order":[95],"conservation":[96],"COG.":[98],"We":[99,152],"calculated":[100],"analyzed":[102],"frequency":[103],"distributions":[104],"each":[106],"attribute":[107],"non-operons":[112],"Escherichia":[114],"coli":[115,144],"(E.":[116],"coli)":[117],"K12":[118,145],"Bacillus":[120],"subtilis":[121,150],"(R":[122],"subtilis)":[123],"168,":[124],"constructed":[126],"trees":[128],"training":[131],"examples":[132],"operons.":[135],"The":[136,171,186],"overall":[137],"accuracy":[139],"is":[140,179,190],"94.1%":[141],"E.":[143],"91.0%":[147],"B.":[149],"168.":[151],"also":[153],"applied":[154],"four":[155],"other":[156],"classifiers,":[157],"logistic":[158],"regression,":[159],"Bayesian,":[161],"support":[165],"vector":[166],"machines":[167],"both":[169],"organisms.":[170],"results":[172],"indicate":[173],"that":[174],"best":[181],"classifier":[182],"prediction.":[185],"software":[187],"package":[188],"operonDT":[189],"freely":[191],"available":[192],"http://www.cs.uga.edn/~che/OperonT":[194]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
