{"id":"https://openalex.org/W2908351833","doi":"https://doi.org/10.1093/bioinformatics/bty1068","title":"Promoter analysis and prediction in the human genome using sequence-based deep learning models","display_name":"Promoter analysis and prediction in the human genome using sequence-based deep learning models","publication_year":2018,"publication_date":"2018-12-27","ids":{"openalex":"https://openalex.org/W2908351833","doi":"https://doi.org/10.1093/bioinformatics/bty1068","mag":"2908351833","pmid":"https://pubmed.ncbi.nlm.nih.gov/30601980"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/bty1068","is_oa":false,"landing_page_url":"https://doi.org/10.1093/bioinformatics/bty1068","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033647731","display_name":"Ramzan Umarov","orcid":"https://orcid.org/0000-0003-3477-7101"},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Ramzan Umarov","raw_affiliation_strings":["Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005997934","display_name":"Hiroyuki Kuwahara","orcid":"https://orcid.org/0000-0001-5333-6729"},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Hiroyuki Kuwahara","raw_affiliation_strings":["Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100345753","display_name":"Yu Li","orcid":"https://orcid.org/0000-0002-3664-6722"},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Yu Li","raw_affiliation_strings":["Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia"],"raw_orcid":"https://orcid.org/0000-0002-3664-6722","affiliations":[{"raw_affiliation_string":"Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100618900","display_name":"Xin Gao","orcid":"https://orcid.org/0000-0002-7108-3574"},"institutions":[{"id":"https://openalex.org/I71920554","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38","country_code":"SA","type":"education","lineage":["https://openalex.org/I71920554"]}],"countries":["SA"],"is_corresponding":true,"raw_author_name":"Xin Gao","raw_affiliation_strings":["Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computational Bioscience Research Center, Computer, Electrical and Mathematical Sciences and Engineering Division, King Abdullah University of Science and Technology, Thuwal, Saudi Arabia","institution_ids":["https://openalex.org/I71920554"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019821677","display_name":"Victor Solovyev","orcid":"https://orcid.org/0000-0001-8885-493X"},"institutions":[{"id":"https://openalex.org/I4210116466","display_name":"Institute of Cytology and Genetics","ror":"https://ror.org/0277xgb12","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I1313323035","https://openalex.org/I188973947","https://openalex.org/I4210116466","https://openalex.org/I4210127387","https://openalex.org/I4210129690"]},{"id":"https://openalex.org/I4210127387","display_name":"Siberian Branch of the Russian Academy of Sciences","ror":"https://ror.org/02frkq021","country_code":"RU","type":"funder","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210127387"]}],"countries":["RU"],"is_corresponding":true,"raw_author_name":"Victor Solovyev","raw_affiliation_strings":["Department of Cell Biology, Institute of Cytology and Genetics SB RAS, Novosibirsk, Russia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Cell Biology, Institute of Cytology and Genetics SB RAS, Novosibirsk, Russia","institution_ids":["https://openalex.org/I4210116466","https://openalex.org/I4210127387"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5019821677","https://openalex.org/A5100618900"],"corresponding_institution_ids":["https://openalex.org/I4210116466","https://openalex.org/I4210127387","https://openalex.org/I71920554"],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":null,"fwci":5.6582,"has_fulltext":false,"cited_by_count":123,"citation_normalized_percentile":{"value":0.97031517,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"35","issue":"16","first_page":"2730","last_page":"2737"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.5127999782562256,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.5127999782562256,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.4480000138282776,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.007899999618530273,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/promoter","display_name":"Promoter","score":0.7076292634010315},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6783415079116821},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5757536292076111},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5608214139938354},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5513267517089844},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5103537440299988},{"id":"https://openalex.org/keywords/human-genome","display_name":"Human genome","score":0.5103535056114197},{"id":"https://openalex.org/keywords/dna-binding-site","display_name":"DNA binding site","score":0.44230926036834717},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.4288049042224884},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3916390538215637},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.35107094049453735},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34744369983673096},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.3365744352340698},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.29097065329551697},{"id":"https://openalex.org/keywords/gene-expression","display_name":"Gene expression","score":0.12509188055992126}],"concepts":[{"id":"https://openalex.org/C101762097","wikidata":"https://www.wikidata.org/wiki/Q224093","display_name":"Promoter","level":4,"score":0.7076292634010315},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6783415079116821},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5757536292076111},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5608214139938354},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5513267517089844},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5103537440299988},{"id":"https://openalex.org/C197077220","wikidata":"https://www.wikidata.org/wiki/Q720988","display_name":"Human genome","level":4,"score":0.5103535056114197},{"id":"https://openalex.org/C3662595","wikidata":"https://www.wikidata.org/wiki/Q5205743","display_name":"DNA binding site","level":5,"score":0.44230926036834717},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.4288049042224884},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3916390538215637},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.35107094049453735},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34744369983673096},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.3365744352340698},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.29097065329551697},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.12509188055992126},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011401","descriptor_name":"Promoter Regions, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011401","descriptor_name":"Promoter Regions, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011401","descriptor_name":"Promoter Regions, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015894","descriptor_name":"Genome, Human","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015894","descriptor_name":"Genome, Human","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015894","descriptor_name":"Genome, Human","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D024363","descriptor_name":"Transcription Initiation Site","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D024363","descriptor_name":"Transcription Initiation Site","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D024363","descriptor_name":"Transcription Initiation Site","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":3,"locations":[{"id":"doi:10.1093/bioinformatics/bty1068","is_oa":false,"landing_page_url":"https://doi.org/10.1093/bioinformatics/bty1068","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmid:30601980","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/30601980","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics (Oxford, England)","raw_type":null},{"id":"pmh:oai:repository.kaust.edu.sa:10754/630783","is_oa":false,"landing_page_url":"http://hdl.handle.net/10754/630783","pdf_url":null,"source":{"id":"https://openalex.org/S4306401596","display_name":"King Abdullah University of Science and Technology Repository (King Abdullah University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I71920554","host_organization_name":"King Abdullah University of Science and Technology","host_organization_lineage":["https://openalex.org/I71920554"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7099999785423279,"display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322320","display_name":"King Abdullah University of Science and Technology","ror":"https://ror.org/01q3tbs38"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1491459594","https://openalex.org/W1522301498","https://openalex.org/W1971456303","https://openalex.org/W1989471545","https://openalex.org/W1989843455","https://openalex.org/W1993502678","https://openalex.org/W2001280003","https://openalex.org/W2027349221","https://openalex.org/W2029492292","https://openalex.org/W2033831809","https://openalex.org/W2067116931","https://openalex.org/W2083073732","https://openalex.org/W2095705004","https://openalex.org/W2102582209","https://openalex.org/W2113197426","https://openalex.org/W2126939295","https://openalex.org/W2130395351","https://openalex.org/W2137458297","https://openalex.org/W2147380886","https://openalex.org/W2148503087","https://openalex.org/W2154854793","https://openalex.org/W2159164310","https://openalex.org/W2169351355","https://openalex.org/W2170698318","https://openalex.org/W2170798594","https://openalex.org/W2464717012","https://openalex.org/W2557250028","https://openalex.org/W2558947257","https://openalex.org/W2567174107","https://openalex.org/W2578532919","https://openalex.org/W2579909079","https://openalex.org/W2746992081","https://openalex.org/W2765741842","https://openalex.org/W2806965771","https://openalex.org/W2952020316","https://openalex.org/W2963739921","https://openalex.org/W6631190155","https://openalex.org/W6674330103","https://openalex.org/W6752660601"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W2761785940","https://openalex.org/W2110523656","https://openalex.org/W1482209366","https://openalex.org/W2521627374"],"abstract_inverted_index":{"MOTIVATION:":[0],"Computational":[1],"identification":[2,36],"of":[3,19,71,85,143,151,167],"promoters":[4,101],"is":[5,161,178],"notoriously":[6],"difficult":[7],"as":[8,180],"human":[9,100,169],"genes":[10],"often":[11],"have":[12,39,147,154],"unique":[13],"promoter":[14,35,66,135,170],"sequences":[15,93],"that":[16,59],"provide":[17],"regulation":[18],"transcription":[20,24,87],"and":[21,67,108,153],"interaction":[22],"with":[23],"initiation":[25],"complex.":[26],"While":[27],"there":[28],"are":[29],"many":[30],"attempts":[31],"to":[32,43,63,102],"develop":[33,54],"computational":[34],"methods,":[37],"we":[38,52,80],"no":[40],"reliable":[41],"tool":[42],"analyze":[44],"long":[45],"genomic":[46,92],"sequences.":[47,69],"RESULTS:":[48],"In":[49],"this":[50,78],"work,":[51],"further":[53],"our":[55],"deep":[56,111],"learning":[57,112],"approach":[58],"was":[60],"relatively":[61],"successful":[62],"discriminate":[64],"short":[65],"non-promoter":[68],"Instead":[70],"focusing":[72],"on":[73],"the":[74,82,86,91,124,132,141,165],"classification":[75],"accuracy,":[76],"in":[77],"work":[79],"predict":[81],"exact":[83],"positions":[84],"start":[88],"site":[89],"inside":[90],"testing":[94],"every":[95],"possible":[96],"location.":[97],"We":[98,146],"studied":[99],"find":[103],"effective":[104],"regions":[105],"for":[106],"discrimination":[107],"built":[109],"corresponding":[110],"models.":[113],"These":[114],"models":[115],"use":[116],"adaptively":[117],"constructed":[118],"negative":[119],"set,":[120],"which":[121,160],"iteratively":[122],"improves":[123],"model's":[125],"discriminative":[126],"ability.":[127],"Our":[128],"method":[129,177],"significantly":[130,162],"outperforms":[131],"previously":[133],"developed":[134,176],"prediction":[136],"programs":[137],"by":[138],"considerably":[139],"reducing":[140],"number":[142],"false-positive":[144],"predictions.":[145],"achieved":[148],"error-per-1000-bp":[149],"rate":[150],"0.02":[152],"0.31":[155],"errors":[156],"per":[157],"correct":[158],"prediction,":[159],"better":[163],"than":[164],"results":[166],"other":[168],"predictors.":[171],"AVAILABILITY":[172],"AND":[173],"IMPLEMENTATION:":[174],"The":[175],"available":[179],"a":[181],"web":[182],"server":[183],"at":[184],"http://www.cbrc.kaust.edu.sa/PromID/.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":19},{"year":2022,"cited_by_count":20},{"year":2021,"cited_by_count":27},{"year":2020,"cited_by_count":19},{"year":2019,"cited_by_count":13}],"updated_date":"2026-05-25T08:39:21.599409","created_date":"2025-10-10T00:00:00"}
