{"id":"https://openalex.org/W4220984910","doi":"https://doi.org/10.1186/s13040-022-00291-0","title":"mSRFR: a machine learning model using microalgal signature features for ncRNA classification","display_name":"mSRFR: a machine learning model using microalgal signature features for ncRNA classification","publication_year":2022,"publication_date":"2022-03-21","ids":{"openalex":"https://openalex.org/W4220984910","doi":"https://doi.org/10.1186/s13040-022-00291-0","pmid":"https://pubmed.ncbi.nlm.nih.gov/35313925"},"language":"en","primary_location":{"id":"doi:10.1186/s13040-022-00291-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13040-022-00291-0","pdf_url":"https://biodatamining.biomedcentral.com/track/pdf/10.1186/s13040-022-00291-0","source":{"id":"https://openalex.org/S84409260","display_name":"BioData Mining","issn_l":"1756-0381","issn":["1756-0381"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData Mining","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://biodatamining.biomedcentral.com/track/pdf/10.1186/s13040-022-00291-0","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000972158","display_name":"Songtham Anuntakarun","orcid":"https://orcid.org/0000-0002-6849-0523"},"institutions":[{"id":"https://openalex.org/I60837268","display_name":"King Mongkut's University of Technology Thonburi","ror":"https://ror.org/0057ax056","country_code":"TH","type":"education","lineage":["https://openalex.org/I60837268"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Songtham Anuntakarun","raw_affiliation_strings":["Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand","School of Information Technology, KMUTT, Bang Mod, Thung Khru, Bangkok, 10140, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand","institution_ids":["https://openalex.org/I60837268"]},{"raw_affiliation_string":"School of Information Technology, KMUTT, Bang Mod, Thung Khru, Bangkok, 10140, Thailand","institution_ids":["https://openalex.org/I60837268"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027545777","display_name":"Supatcha Lertampaiporn","orcid":"https://orcid.org/0000-0002-8465-847X"},"institutions":[{"id":"https://openalex.org/I1332092204","display_name":"National Science and Technology Development Agency","ror":"https://ror.org/04vy95b61","country_code":"TH","type":"government","lineage":["https://openalex.org/I1332092204"]},{"id":"https://openalex.org/I60837268","display_name":"King Mongkut's University of Technology Thonburi","ror":"https://ror.org/0057ax056","country_code":"TH","type":"education","lineage":["https://openalex.org/I60837268"]},{"id":"https://openalex.org/I902798049","display_name":"National Center for Genetic Engineering and Biotechnology","ror":"https://ror.org/047aswc67","country_code":"TH","type":"facility","lineage":["https://openalex.org/I1332092204","https://openalex.org/I902798049"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Supatcha Lertampaiporn","raw_affiliation_strings":["Biochemical Engineering and Systems Biology Research Group, National Center for Genetic Engineering and Biotechnology (BIOTEC), National Science and Technology Development Agency at King Mongkut's University of Technology Thonburi, Bang Khun Thian, Bangkok, 10150, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Biochemical Engineering and Systems Biology Research Group, National Center for Genetic Engineering and Biotechnology (BIOTEC), National Science and Technology Development Agency at King Mongkut's University of Technology Thonburi, Bang Khun Thian, Bangkok, 10150, Thailand","institution_ids":["https://openalex.org/I1332092204","https://openalex.org/I60837268","https://openalex.org/I902798049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013407366","display_name":"Teeraphan Laomettachit","orcid":"https://orcid.org/0000-0003-3194-1391"},"institutions":[{"id":"https://openalex.org/I60837268","display_name":"King Mongkut's University of Technology Thonburi","ror":"https://ror.org/0057ax056","country_code":"TH","type":"education","lineage":["https://openalex.org/I60837268"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Teeraphan Laomettachit","raw_affiliation_strings":["Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand","institution_ids":["https://openalex.org/I60837268"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087961585","display_name":"Warin Wattanapornprom","orcid":"https://orcid.org/0000-0002-9710-6893"},"institutions":[{"id":"https://openalex.org/I60837268","display_name":"King Mongkut's University of Technology Thonburi","ror":"https://ror.org/0057ax056","country_code":"TH","type":"education","lineage":["https://openalex.org/I60837268"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Warin Wattanapornprom","raw_affiliation_strings":["Department of Mathematics, Faculty of Science, KMUTT, Bangkok, 10140, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mathematics, Faculty of Science, KMUTT, Bangkok, 10140, Thailand","institution_ids":["https://openalex.org/I60837268"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015959832","display_name":"Marasri Ruengjitchatchawalya","orcid":"https://orcid.org/0000-0003-2872-7757"},"institutions":[{"id":"https://openalex.org/I60837268","display_name":"King Mongkut's University of Technology Thonburi","ror":"https://ror.org/0057ax056","country_code":"TH","type":"education","lineage":["https://openalex.org/I60837268"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Marasri Ruengjitchatchawalya","raw_affiliation_strings":["Algal Biotechnology Research Group, Pilot Plant Development and Training Institute (PDTI), KMUTT, Bang Khun Thian, Bangkok, 10150, Thailand. marasri.rue@kmutt.ac.th","Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand. marasri.rue@kmutt.ac.th","Biotechnology program, School of Bioresources and Technology, KMUTT, Bang Khun Thian, Bangkok, 10150, Thailand. marasri.rue@kmutt.ac.th","Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand"],"raw_orcid":"https://orcid.org/0000-0003-2872-7757","affiliations":[{"raw_affiliation_string":"Algal Biotechnology Research Group, Pilot Plant Development and Training Institute (PDTI), KMUTT, Bang Khun Thian, Bangkok, 10150, Thailand. marasri.rue@kmutt.ac.th","institution_ids":["https://openalex.org/I60837268"]},{"raw_affiliation_string":"Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand. marasri.rue@kmutt.ac.th","institution_ids":["https://openalex.org/I60837268"]},{"raw_affiliation_string":"Biotechnology program, School of Bioresources and Technology, KMUTT, Bang Khun Thian, Bangkok, 10150, Thailand. marasri.rue@kmutt.ac.th","institution_ids":["https://openalex.org/I60837268"]},{"raw_affiliation_string":"Bioinformatics and Systems Biology Program, School of Bioresources and Technology, King Mongkut's University of Technology Thonburi (KMUTT), Bangkok, 10150, Thailand","institution_ids":["https://openalex.org/I60837268"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5000972158"],"corresponding_institution_ids":["https://openalex.org/I60837268"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":0.868,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.70490249,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"15","issue":"1","first_page":"8","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12388","display_name":"Identification and Quantification in Food","score":0.9706000089645386,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10506","display_name":"Aquaculture disease management and microbiota","score":0.9420999884605408,"subfield":{"id":"https://openalex.org/subfields/2403","display_name":"Immunology"},"field":{"id":"https://openalex.org/fields/24","display_name":"Immunology and Microbiology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7355800867080688},{"id":"https://openalex.org/keywords/signature","display_name":"Signature (topology)","score":0.7190839648246765},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.610158383846283},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5859482288360596},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.38546323776245117},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3325777053833008},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09612682461738586}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7355800867080688},{"id":"https://openalex.org/C2779696439","wikidata":"https://www.wikidata.org/wiki/Q7512811","display_name":"Signature (topology)","level":2,"score":0.7190839648246765},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.610158383846283},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5859482288360596},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.38546323776245117},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3325777053833008},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09612682461738586},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1186/s13040-022-00291-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13040-022-00291-0","pdf_url":"https://biodatamining.biomedcentral.com/track/pdf/10.1186/s13040-022-00291-0","source":{"id":"https://openalex.org/S84409260","display_name":"BioData Mining","issn_l":"1756-0381","issn":["1756-0381"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData Mining","raw_type":"journal-article"},{"id":"pmid:35313925","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35313925","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData mining","raw_type":null},{"id":"pmh:oai:doaj.org/article:7efbd85573cd4b3ebce6d30245bb5b84","is_oa":true,"landing_page_url":"https://doaj.org/article/7efbd85573cd4b3ebce6d30245bb5b84","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BioData Mining, Vol 15, Iss 1, Pp 1-11 (2022)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:8935802","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/8935802","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BioData Min","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13040-022-00291-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13040-022-00291-0","pdf_url":"https://biodatamining.biomedcentral.com/track/pdf/10.1186/s13040-022-00291-0","source":{"id":"https://openalex.org/S84409260","display_name":"BioData Mining","issn_l":"1756-0381","issn":["1756-0381"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BioData Mining","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15","score":0.7300000190734863}],"awards":[{"id":"https://openalex.org/G7286301589","display_name":null,"funder_award_id":"P18-51620","funder_id":"https://openalex.org/F4320326787","funder_display_name":"National Center for Genetic Engineering and Biotechnology"}],"funders":[{"id":"https://openalex.org/F4320322818","display_name":"King Mongkut's University of Technology Thonburi","ror":"https://ror.org/0057ax056"},{"id":"https://openalex.org/F4320326787","display_name":"National Center for Genetic Engineering and Biotechnology","ror":"https://ror.org/047aswc67"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4220984910.pdf","grobid_xml":"https://content.openalex.org/works/W4220984910.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W1967102258","https://openalex.org/W1984780475","https://openalex.org/W1996998725","https://openalex.org/W2008108163","https://openalex.org/W2041856473","https://openalex.org/W2051725773","https://openalex.org/W2060313313","https://openalex.org/W2061548680","https://openalex.org/W2075320162","https://openalex.org/W2083588045","https://openalex.org/W2091489934","https://openalex.org/W2094686600","https://openalex.org/W2102764178","https://openalex.org/W2107994759","https://openalex.org/W2111785130","https://openalex.org/W2115787060","https://openalex.org/W2124050695","https://openalex.org/W2132166479","https://openalex.org/W2133990480","https://openalex.org/W2161364752","https://openalex.org/W2468596032","https://openalex.org/W2509738156","https://openalex.org/W2605614336","https://openalex.org/W2615786037","https://openalex.org/W2795896985","https://openalex.org/W2810474688","https://openalex.org/W2914698725","https://openalex.org/W2944543839","https://openalex.org/W2968812970"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4313488044","https://openalex.org/W3209574120","https://openalex.org/W4312192474","https://openalex.org/W2033914206"],"abstract_inverted_index":{"This":[0],"work":[1],"presents":[2],"mSRFR":[3],"(microalgae":[4],"SMOTE":[5,29],"Random":[6,103,127,139],"Forest":[7,128,140],"Relief":[8,81,185],"model),":[9],"a":[10,63,92,159,166,192],"classification":[11],"tool":[12],"for":[13],"noncoding":[14],"RNAs":[15],"(ncRNAs)":[16],"in":[17,51,173],"microalgae,":[18],"including":[19,68,149],"green":[20],"algae,":[21,24],"diatoms,":[22],"golden":[23],"and":[25,73,111,144,154,165,207],"cyanobacteria.":[26],"First,":[27],"the":[28,35,42,52,57,80,96,116,126,131,138,175,181,188],"technique":[30],"was":[31,88,142],"applied":[32,89],"to":[33,41,90,200],"address":[34],"challenge":[36],"of":[37,45,65,135,162,170,178,195],"imbalanced":[38],"data":[39],"due":[40],"different":[43,49],"numbers":[44],"microalgae":[46],"ncRNAs":[47,197],"from":[48,62,184],"species":[50],"EBI":[53],"RNA-central":[54],"database.":[55],"Then":[56],"top":[58,182],"20":[59],"significant":[60],"features":[61,183],"total":[64],"106":[66],"features,":[67,76],"sequence-based,":[69],"secondary":[70],"structure,":[71],"base-pair,":[72],"triplet":[74],"sequence-structure":[75],"were":[77],"selected":[78,143],"using":[79],"feature":[82,194],"selection":[83],"method.":[84],"Next,":[85],"ten-fold":[86],"cross-validation":[87],"choose":[91],"classifier":[93,129],"algorithm":[94,141],"with":[95,146],"highest":[97,132],"performance":[98],"among":[99],"Support":[100],"Vector":[101],"Machine,":[102],"Forest,":[104],"Decision":[105],"Tree,":[106],"Na\u00efve":[107],"Bayes,":[108],"K-nearest":[109],"Neighbor,":[110],"Neural":[112],"Network,":[113],"based":[114],"on":[115],"receiver":[117],"operating":[118],"characteristic":[119],"(ROC)":[120],"area.":[121],"The":[122],"results":[123],"showed":[124],"that":[125,187],"achieved":[130,158],"ROC":[133],"area":[134],"0.992.":[136],"Then,":[137],"compared":[145,199],"other":[147],"tools,":[148],"RNAcon,":[150],"CPC,":[151],"CPC2,":[152],"CNCI,":[153],"CPPred.":[155],"Our":[156],"model":[157],"high":[160],"accuracy":[161],"about":[163,171],"97%":[164],"low":[167],"false-positive":[168],"rate":[169],"2%":[172],"predicting":[174],"test":[176],"dataset":[177],"microalgae.":[179],"Furthermore,":[180],"revealed":[186],"%GA":[189],"dinucleotide":[190],"is":[191],"signature":[193],"microalgal":[196],"when":[198],"Escherichia":[201],"coli,":[202],"Saccharomyces":[203],"cerevisiae,":[204],"Arabidopsis":[205],"thaliana,":[206],"Homo":[208],"sapiens.":[209]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
