{"id":"https://openalex.org/W2968451579","doi":"https://doi.org/10.1109/cibcb.2019.8791456","title":"Predicting gene expression level in E. coli from mRNA sequence information","display_name":"Predicting gene expression level in E. coli from mRNA sequence information","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2968451579","doi":"https://doi.org/10.1109/cibcb.2019.8791456","mag":"2968451579"},"language":"en","primary_location":{"id":"doi:10.1109/cibcb.2019.8791456","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cibcb.2019.8791456","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Conference on Computational Intelligence in Bioinformatics and Computational Biology (CIBCB)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089603004","display_name":"Linlin Zhao","orcid":"https://orcid.org/0000-0002-8821-4198"},"institutions":[{"id":"https://openalex.org/I44260953","display_name":"Heinrich Heine University D\u00fcsseldorf","ror":"https://ror.org/024z2rq82","country_code":"DE","type":"education","lineage":["https://openalex.org/I44260953"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Linlin Zhao","raw_affiliation_strings":["Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany","institution_ids":["https://openalex.org/I44260953"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036973535","display_name":"Nima Abedpour","orcid":"https://orcid.org/0000-0002-2933-8035"},"institutions":[{"id":"https://openalex.org/I180923762","display_name":"University of Cologne","ror":"https://ror.org/00rcxh774","country_code":"DE","type":"education","lineage":["https://openalex.org/I180923762"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Nima Abedpour","raw_affiliation_strings":["Department of Translational Genomics, University of Cologne, Cologne, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Translational Genomics, University of Cologne, Cologne, Germany","institution_ids":["https://openalex.org/I180923762"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033823993","display_name":"Christopher Blum","orcid":"https://orcid.org/0009-0003-3663-0362"},"institutions":[{"id":"https://openalex.org/I44260953","display_name":"Heinrich Heine University D\u00fcsseldorf","ror":"https://ror.org/024z2rq82","country_code":"DE","type":"education","lineage":["https://openalex.org/I44260953"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christopher Blum","raw_affiliation_strings":["Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany","institution_ids":["https://openalex.org/I44260953"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063111257","display_name":"Petra Kolkhof","orcid":null},"institutions":[{"id":"https://openalex.org/I44260953","display_name":"Heinrich Heine University D\u00fcsseldorf","ror":"https://ror.org/024z2rq82","country_code":"DE","type":"education","lineage":["https://openalex.org/I44260953"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Petra Kolkhof","raw_affiliation_strings":["Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany","institution_ids":["https://openalex.org/I44260953"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016803881","display_name":"Mathias Beller","orcid":"https://orcid.org/0000-0003-0987-0080"},"institutions":[{"id":"https://openalex.org/I44260953","display_name":"Heinrich Heine University D\u00fcsseldorf","ror":"https://ror.org/024z2rq82","country_code":"DE","type":"education","lineage":["https://openalex.org/I44260953"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Mathias Beller","raw_affiliation_strings":["Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany","institution_ids":["https://openalex.org/I44260953"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110456998","display_name":"Markus Kollmann","orcid":null},"institutions":[{"id":"https://openalex.org/I44260953","display_name":"Heinrich Heine University D\u00fcsseldorf","ror":"https://ror.org/024z2rq82","country_code":"DE","type":"education","lineage":["https://openalex.org/I44260953"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Markus Kollmann","raw_affiliation_strings":["Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Biology, Heinrich Heine University, D\u00fcsseldorf, Germany","institution_ids":["https://openalex.org/I44260953"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029911656","display_name":"Emidio Capriotti","orcid":"https://orcid.org/0000-0002-2323-0963"},"institutions":[{"id":"https://openalex.org/I9360294","display_name":"University of Bologna","ror":"https://ror.org/01111rn36","country_code":"IT","type":"education","lineage":["https://openalex.org/I9360294"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Emidio Capriotti","raw_affiliation_strings":["Department of Pharmacy and Biotechnology, University of Bologna, Bologna, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Pharmacy and Biotechnology, University of Bologna, Bologna, Italy","institution_ids":["https://openalex.org/I9360294"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0855,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.47638065,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coding-region","display_name":"Coding region","score":0.6138375997543335},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.6129671335220337},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5653917789459229},{"id":"https://openalex.org/keywords/gene-prediction","display_name":"Gene prediction","score":0.49050039052963257},{"id":"https://openalex.org/keywords/gene-expression","display_name":"Gene expression","score":0.4817892909049988},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.46997612714767456},{"id":"https://openalex.org/keywords/ribosomal-binding-site","display_name":"Ribosomal binding site","score":0.4693518579006195},{"id":"https://openalex.org/keywords/eukaryotic-translation","display_name":"Eukaryotic translation","score":0.4441753029823303},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.4354126453399658},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.42234641313552856},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4207892417907715},{"id":"https://openalex.org/keywords/messenger-rna","display_name":"Messenger RNA","score":0.39276301860809326},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.3900047540664673},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3419939875602722},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.2602041959762573},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.24067750573158264}],"concepts":[{"id":"https://openalex.org/C91779695","wikidata":"https://www.wikidata.org/wiki/Q3780824","display_name":"Coding region","level":3,"score":0.6138375997543335},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.6129671335220337},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5653917789459229},{"id":"https://openalex.org/C105565629","wikidata":"https://www.wikidata.org/wiki/Q1248292","display_name":"Gene prediction","level":4,"score":0.49050039052963257},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.4817892909049988},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.46997612714767456},{"id":"https://openalex.org/C114847915","wikidata":"https://www.wikidata.org/wiki/Q16948788","display_name":"Ribosomal binding site","level":5,"score":0.4693518579006195},{"id":"https://openalex.org/C4718897","wikidata":"https://www.wikidata.org/wiki/Q5408698","display_name":"Eukaryotic translation","level":5,"score":0.4441753029823303},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.4354126453399658},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.42234641313552856},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4207892417907715},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.39276301860809326},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.3900047540664673},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3419939875602722},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.2602041959762573},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.24067750573158264},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cibcb.2019.8791456","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cibcb.2019.8791456","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Conference on Computational Intelligence in Bioinformatics and Computational Biology (CIBCB)","raw_type":"proceedings-article"},{"id":"pmh:oai:cris.unibo.it:11585/738254","is_oa":false,"landing_page_url":"http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=8782659","pdf_url":null,"source":{"id":"https://openalex.org/S4306402579","display_name":"Archivio istituzionale della ricerca (Alma Mater Studiorum Universit\u00e0 di Bologna)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210117483","host_organization_name":"Istituto di Ematologia di Bologna","host_organization_lineage":["https://openalex.org/I4210117483"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320312852","display_name":"University of Alabama","ror":"https://ror.org/03xrrjk67"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W89691187","https://openalex.org/W1969026947","https://openalex.org/W2008625423","https://openalex.org/W2018645639","https://openalex.org/W2025569664","https://openalex.org/W2035475950","https://openalex.org/W2041882488","https://openalex.org/W2047360542","https://openalex.org/W2051242197","https://openalex.org/W2051482716","https://openalex.org/W2063779182","https://openalex.org/W2065063088","https://openalex.org/W2066753114","https://openalex.org/W2066829062","https://openalex.org/W2085369061","https://openalex.org/W2086561953","https://openalex.org/W2092035637","https://openalex.org/W2100908594","https://openalex.org/W2101234009","https://openalex.org/W2108215151","https://openalex.org/W2113221971","https://openalex.org/W2116687527","https://openalex.org/W2119336718","https://openalex.org/W2134582538","https://openalex.org/W2166064969","https://openalex.org/W2166752189","https://openalex.org/W2170513170","https://openalex.org/W2273190468","https://openalex.org/W6675354045"],"related_works":["https://openalex.org/W2000890478","https://openalex.org/W1985367916","https://openalex.org/W2032956499","https://openalex.org/W1983106607","https://openalex.org/W3214129649","https://openalex.org/W2066551576","https://openalex.org/W2397850191","https://openalex.org/W4239750012","https://openalex.org/W2092265915","https://openalex.org/W2091757533"],"abstract_inverted_index":{"The":[0,116,302],"accurate":[1,51],"characterization":[2],"of":[3,13,25,50,86,90,123,141,175,183,215,240,272,275,304,308],"the":[4,14,23,26,48,55,62,84,87,106,142,148,154,166,171,176,180,184,204,226,251,259,270,273,276,283,305,309],"translational":[5,277],"mechanism":[6],"is":[7,65,160,229],"crucial":[8],"for":[9,40,53,82,147],"enhancing":[10],"our":[11,289,316],"understanding":[12],"relationship":[15],"between":[16],"genotype":[17],"and":[18,38,111,188,247,279],"phenotype.":[19],"In":[20,45,72,207,258],"particular,":[21],"predicting":[22,54,83],"impact":[24],"genetic":[27],"variants":[28,126,140,311],"on":[29,120,203,282,295],"gene":[30,158],"expression":[31,60,306],"will":[32],"allow":[33],"to":[34,105],"optimize":[35],"specific":[36],"pathways":[37],"functions":[39],"engineering":[41],"new":[42,79,310],"biological":[43],"systems.":[44],"this":[46,73,208],"context,":[47],"development":[49],"methods":[52],"translation":[56,88],"efficiency":[57,89,278],"and/or":[58],"protein":[59],"from":[61],"nucleotide":[63],"sequence":[64,93,125,139,162,300],"a":[66,78,121,198,212,218,232,242],"key":[67],"challenge":[68],"in":[69,94,264,269,313,319],"computational":[70],"biology.":[71],"work":[74],"we":[75,136,287],"present":[76],"PGExpress,":[77],"regression":[80,227,260],"method":[81,117,290],"log2-fold-change":[85,274],"an":[91,237,248],"mRNA":[92,299],"E.":[95,130,320],"coli.":[96,321],"PGExpress":[97,210,235,262],"algorithm":[98],"takes":[99],"as":[100,231],"input":[101],"12":[102],"features":[103],"corresponding":[104],"predicted":[107],"RNA":[108],"secondary":[109],"structure":[110],"anti-Shine-Dalgarno":[112],"hybridization":[113],"free":[114],"energies.":[115],"was":[118,195],"trained":[119,196],"set":[122],"1,772":[124],"(WT-High)of":[127],"137":[128],"essential":[129],"coli":[131],"genes.":[132],"For":[133],"each":[134],"gene,":[135],"considered":[137],"13":[138],"first":[143,172],"33":[144,173],"nucleotides":[145,174],"encoding":[146],"same":[149],"amino":[150],"acids":[151],"followed":[152],"by":[153,291],"superfolder":[155],"GFP.":[156],"Each":[157],"variant":[159],"represented":[161],"blocks":[163],"that":[164],"include":[165],"Ribosome":[167],"Binding":[168],"Site":[169],"(RBS),":[170],"coding":[177,185],"region":[178,186],"(C33),":[179],"remaining":[181],"part":[182],"(CC),":[187],"their":[189],"combinations.":[190],"Our":[191],"gradient-boosting-based":[192],"tool":[193],"(PGExpress)":[194],"using":[197],"10-fold":[199],"gene-based":[200],"cross-validation":[201],"procedure":[202],"WT-High":[205,284],"dataset.":[206,285],"test":[209],"achieved":[211],"correlation":[213,244],"coefficient":[214,245],"0.60,":[216],"with":[217,315],"Root":[219],"Mean":[220],"Square":[221],"Error":[222],"(RMSE)of":[223],"1.3.":[224],"When":[225],"task":[228],"cast":[230],"classification":[233],"problem,":[234],"reached":[236],"overall":[238],"accuracy":[239],"0.74":[241],"Matthews":[243],"0.48":[246],"Area":[249],"Under":[250],"Receiver":[252],"Operating":[253],"Characteristic":[254],"Curve":[255],"(AUC)of":[256],"0.81.":[257],"task,":[261],"results":[263,318],"better":[265],"performance":[266],"than":[267],"RBSCalculator":[268],"prediction":[271],"its":[280],"variation":[281],"Finally,":[286],"validated":[288],"performing":[292],"in-house":[293],"experiments":[294],"five":[296],"newly":[297],"generated":[298],"variants.":[301],"predictions":[303],"level":[307],"are":[312],"agreement":[314],"experimental":[317]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2019-08-22T00:00:00"}
