{"id":"https://openalex.org/W7135387579","doi":"https://doi.org/10.1021/acs.jcim.6c00056","title":"ncProFormer: A CNN-enhanced Transformer for ncRNA Coding-Potential Prediction","display_name":"ncProFormer: A CNN-enhanced Transformer for ncRNA Coding-Potential Prediction","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7135387579","doi":"https://doi.org/10.1021/acs.jcim.6c00056","pmid":"https://pubmed.ncbi.nlm.nih.gov/41830618"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.6c00056","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.6c00056","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072355113","display_name":"Mengyu Tong","orcid":"https://orcid.org/0000-0002-1404-9943"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyu Tong","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015797870","display_name":"Yuanting Chen","orcid":"https://orcid.org/0000-0003-1294-479X"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanting Chen","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129161396","display_name":"Long Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Long Chen","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101856485","display_name":"Jiayi Xu","orcid":"https://orcid.org/0000-0003-3465-7927"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingnan Xu","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129278847","display_name":"Yingjie Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingjie Yang","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101576373","display_name":"Guixia Liu","orcid":"https://orcid.org/0000-0001-9648-844X"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guixia Liu","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":"https://orcid.org/0000-0001-9648-844X","affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129289079","display_name":"Weihua Li","orcid":null},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weihua Li","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":"https://orcid.org/0000-0001-7055-9836","affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080564633","display_name":"Y. S. Tang","orcid":"https://orcid.org/0000-0003-2340-1109"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yun Tang","raw_affiliation_strings":["Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China"],"raw_orcid":"https://orcid.org/0000-0003-2340-1109","affiliations":[{"raw_affiliation_string":"Shanghai Frontiers Science Center of Optogenetic Techniques for Cell Metabolism, Shanghai Key Laboratory of New Drug Design, School of Pharmacy, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"State Key Laboratory of Bioreactor Engineering, East China University of Science and Technology, 130 Meilong Road, Shanghai 200237, China","institution_ids":["https://openalex.org/I143593769"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5080564633"],"corresponding_institution_ids":["https://openalex.org/I143593769"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.55070871,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"66","issue":"7","first_page":"3713","last_page":"3724"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10062","display_name":"MicroRNA in disease regulation","score":0.1363999992609024,"subfield":{"id":"https://openalex.org/subfields/1306","display_name":"Cancer Research"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10062","display_name":"MicroRNA in disease regulation","score":0.1363999992609024,"subfield":{"id":"https://openalex.org/subfields/1306","display_name":"Cancer Research"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.10580000281333923,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12131","display_name":"Wireless Signal Modulation Classification","score":0.07370000332593918,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.48510000109672546},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.2847000062465668},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.24289999902248383}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5609999895095825},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.48510000109672546},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4350999891757965},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42500001192092896},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32749998569488525},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2939999997615814},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2847000062465668},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.24420000612735748},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.24289999902248383},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.2273000031709671}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D022661","descriptor_name":"RNA, Untranslated","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D051379","descriptor_name":"Mice","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D051381","descriptor_name":"Rats","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.6c00056","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.6c00056","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:41830618","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41830618","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G177194081","display_name":null,"funder_award_id":"U23A20530","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1980401374","https://openalex.org/W1998422171","https://openalex.org/W2037837681","https://openalex.org/W2048194168","https://openalex.org/W2052503008","https://openalex.org/W2075320162","https://openalex.org/W2139658526","https://openalex.org/W2156125289","https://openalex.org/W2165423269","https://openalex.org/W2175136759","https://openalex.org/W2544360569","https://openalex.org/W2615786037","https://openalex.org/W2886900083","https://openalex.org/W2896457183","https://openalex.org/W2914698725","https://openalex.org/W2951413354","https://openalex.org/W2962784628","https://openalex.org/W2999743161","https://openalex.org/W3013495013","https://openalex.org/W3040739508","https://openalex.org/W3081143873","https://openalex.org/W3095583226","https://openalex.org/W3127238141","https://openalex.org/W3146944767","https://openalex.org/W3202397671","https://openalex.org/W4225858649","https://openalex.org/W4322008681","https://openalex.org/W4380080316","https://openalex.org/W4382681032","https://openalex.org/W4385799332","https://openalex.org/W4388979610","https://openalex.org/W4396676543","https://openalex.org/W4400652889","https://openalex.org/W4400981600","https://openalex.org/W4401305288","https://openalex.org/W4401458581","https://openalex.org/W4403647236","https://openalex.org/W4406419344"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"studies":[1],"have":[2,16],"revealed":[3],"that":[4,141],"some":[5],"noncoding":[6],"RNAs":[7],"(ncRNAs)":[8],"bear":[9],"translational":[10],"potential,":[11],"and":[12,38,72,87,136,148,156,167],"their":[13],"encoded":[14],"micropeptides":[15],"essential":[17],"functions":[18,186],"in":[19,122],"multiple":[20],"biological":[21,144],"processes.":[22],"However,":[23],"accurate":[24],"identification":[25],"of":[26,175],"coding-capable":[27],"ncRNAs":[28],"remains":[29],"challenging":[30],"due":[31],"to":[32,62,81],"weak":[33],"translation":[34],"signals,":[35],"low":[36],"conservation,":[37],"heterogeneous":[39],"data":[40,100,105,111,138],"distributions.":[41],"Herein,":[42],"we":[43],"propose":[44],"ncProFormer,":[45],"a":[46,74,179],"deep":[47],"learning":[48],"framework":[49,169],"tailored":[50],"for":[51,170,183],"ncRNA":[52,123,185],"coding-potential":[53,124],"prediction.":[54,125],"ncProFormer":[55,90,128,163],"integrates":[56],"the":[57,93,97,102,107,118,142,153,172],"nucleic-acid":[58],"language":[59],"model":[60],"GENA-LM":[61],"obtain":[63],"contextual":[64],"sequence":[65],"embeddings,":[66],"adopts":[67],"an":[68,165],"all-token":[69],"representation":[70],"strategy,":[71],"employs":[73],"convolutional":[75],"neural":[76],"network":[77],"(CNN)-enhanced":[78],"transformer":[79],"encoder":[80],"jointly":[82],"capture":[83],"local":[84],"nucleotide":[85],"patterns":[86],"long-range":[88],"dependencies.":[89],"consistently":[91],"outperformed":[92],"existing":[94],"methods":[95],"across":[96,187],"in-house":[98],"human":[99],"set,":[101,106],"external":[103],"validation":[104],"public":[108],"CPPred":[109],"benchmark":[110],"set.":[112],"More":[113],"importantly,":[114],"this":[115],"study":[116],"presents":[117],"first":[119],"cross-species":[120,157],"evaluation":[121],"Without":[126],"retraining,":[127],"maintained":[129],"its":[130],"strong":[131],"predictive":[132],"performance":[133],"on":[134],"mouse":[135],"rat":[137],"sets,":[139],"showing":[140],"learned":[143],"representations":[145],"are":[146],"transferable":[147],"it":[149],"is":[150],"robust":[151],"under":[152],"distributional":[154],"shift":[155],"conditions.":[158],"Collectively,":[159],"these":[160],"findings":[161],"establish":[162],"as":[164],"effective":[166],"generalizable":[168],"uncovering":[171],"coding":[173],"potential":[174],"ncRNAs,":[176],"thus":[177],"offering":[178],"promising":[180],"computational":[181],"tool":[182],"characterizing":[184],"diverse":[188],"transcriptomic":[189],"contexts.":[190]},"counts_by_year":[],"updated_date":"2026-04-14T06:02:45.956762","created_date":"2026-03-15T00:00:00"}
