{"id":"https://openalex.org/W7126234854","doi":"https://doi.org/10.1186/s12859-026-06386-3","title":"Srnc: semi-supervised learning for robust novel cell-type identification in single cell RNA sequencing data","display_name":"Srnc: semi-supervised learning for robust novel cell-type identification in single cell RNA sequencing data","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7126234854","doi":"https://doi.org/10.1186/s12859-026-06386-3","pmid":"https://pubmed.ncbi.nlm.nih.gov/41618152"},"language":"en","primary_location":{"id":"doi:10.1186/s12859-026-06386-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-026-06386-3","pdf_url":null,"source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1186/s12859-026-06386-3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Thi Van Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I70349855","display_name":"Vietnam Academy of Science and Technology","ror":"https://ror.org/02wsd5p50","country_code":"VN","type":"government","lineage":["https://openalex.org/I70349855"]},{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Thi Van Nguyen","raw_affiliation_strings":["University of Science and Technology of Hanoi, Vietnam Academy of Science and Technology, Hanoi, Vietnam"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of Hanoi, Vietnam Academy of Science and Technology, Hanoi, Vietnam","institution_ids":["https://openalex.org/I94518387","https://openalex.org/I70349855"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072375949","display_name":"Van Hoan","orcid":"https://orcid.org/0000-0001-9098-109X"},"institutions":[{"id":"https://openalex.org/I131359167","display_name":"Le Quy Don Technical University","ror":"https://ror.org/04wgyjv21","country_code":"VN","type":"education","lineage":["https://openalex.org/I131359167"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Van Hoan Do","raw_affiliation_strings":["Center for Applied Mathematics and Informatics, Le Quy Don Technical University, Hanoi, Vietnam"],"affiliations":[{"raw_affiliation_string":"Center for Applied Mathematics and Informatics, Le Quy Don Technical University, Hanoi, Vietnam","institution_ids":["https://openalex.org/I131359167"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083724281","display_name":"Vu-Linh Nguyen","orcid":"https://orcid.org/0000-0003-1642-4468"},"institutions":[{"id":"https://openalex.org/I102516824","display_name":"Universit\u00e9 de Technologie de Compi\u00e8gne","ror":"https://ror.org/04y5kwa70","country_code":"FR","type":"education","lineage":["https://openalex.org/I102516824"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Vu-Linh Nguyen","raw_affiliation_strings":["UMR CNRS 7253, Heudiasyc, Sorbonne Universite, Universit\u00e9 de Technologie de Compi\u00e8gne, Compi\u00e8gne, France. vu-linh.nguyen@hds.utc.fr"],"affiliations":[{"raw_affiliation_string":"UMR CNRS 7253, Heudiasyc, Sorbonne Universite, Universit\u00e9 de Technologie de Compi\u00e8gne, Compi\u00e8gne, France. vu-linh.nguyen@hds.utc.fr","institution_ids":["https://openalex.org/I102516824","https://openalex.org/I39804081","https://openalex.org/I1294671590"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5083724281"],"corresponding_institution_ids":["https://openalex.org/I102516824","https://openalex.org/I1294671590","https://openalex.org/I39804081"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.29564589,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11287","display_name":"Cancer Genomics and Diagnostics","score":0.002300000051036477,"subfield":{"id":"https://openalex.org/subfields/1306","display_name":"Cancer Research"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.0010999999940395355,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7455000281333923},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6230999827384949},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5909000039100647},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5181999802589417},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.43529999256134033},{"id":"https://openalex.org/keywords/dna-microarray","display_name":"DNA microarray","score":0.36640000343322754},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3650999963283539},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.3573000133037567}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7455000281333923},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7372999787330627},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6836000084877014},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6340000033378601},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6230999827384949},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5909000039100647},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5181999802589417},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.43529999256134033},{"id":"https://openalex.org/C95371953","wikidata":"https://www.wikidata.org/wiki/Q591745","display_name":"DNA microarray","level":4,"score":0.36640000343322754},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3650999963283539},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.3573000133037567},{"id":"https://openalex.org/C189014844","wikidata":"https://www.wikidata.org/wiki/Q189118","display_name":"Cell type","level":3,"score":0.3343999981880188},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3328999876976013},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3248000144958496},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.27790001034736633},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1186/s12859-026-06386-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-026-06386-3","pdf_url":null,"source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:41618152","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41618152","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:a6c9853f401043a2a3682633efd1d638","is_oa":true,"landing_page_url":"https://doaj.org/article/a6c9853f401043a2a3682633efd1d638","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 27, Iss 1 (2026)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:12934016","is_oa":true,"landing_page_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12934016/","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s12859-026-06386-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-026-06386-3","pdf_url":null,"source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1979283544","https://openalex.org/W2030017878","https://openalex.org/W2033403400","https://openalex.org/W2051658465","https://openalex.org/W2068881679","https://openalex.org/W2071128523","https://openalex.org/W2118377301","https://openalex.org/W2135253885","https://openalex.org/W2294798173","https://openalex.org/W2523369352","https://openalex.org/W2523419694","https://openalex.org/W2523620612","https://openalex.org/W2526262591","https://openalex.org/W2531252525","https://openalex.org/W2783512689","https://openalex.org/W2803144214","https://openalex.org/W2808837841","https://openalex.org/W2947877009","https://openalex.org/W2949829455","https://openalex.org/W2963855710","https://openalex.org/W2971653850","https://openalex.org/W2995410603","https://openalex.org/W3013823153","https://openalex.org/W3014596384","https://openalex.org/W3092982430","https://openalex.org/W3103797259","https://openalex.org/W3130098356","https://openalex.org/W3132715010","https://openalex.org/W3173017111","https://openalex.org/W4235169531","https://openalex.org/W4322768301","https://openalex.org/W4362521490","https://openalex.org/W4379521442","https://openalex.org/W4400073242","https://openalex.org/W4406298433","https://openalex.org/W4406437131","https://openalex.org/W4411670013"],"related_works":[],"abstract_inverted_index":{"Single-cell":[0],"RNA":[1],"sequencing":[2],"(scRNA-seq)":[3],"enables":[4],"the":[5,39,142],"identification":[6,89],"of":[7,237],"cell":[8,21,34,46,79,103,166,201,228],"types":[9,22,35],"within":[10],"complex":[11],"biological":[12],"systems,":[13],"yet":[14],"accurately":[15,163],"classifying":[16],"both":[17,115,141,197],"known":[18,198],"and":[19,117,138,145,157,181,199,216,233],"novel":[20,78,92,200],"remains":[23],"a":[24,91,179,222],"significant":[25],"challenge.":[26],"Supervised":[27],"learning":[28,84,109],"methods":[29,170,205],"perform":[30],"well":[31],"when":[32],"all":[33],"are":[36],"labeled":[37,116],"in":[38,159,187,206],"training":[40],"data,":[41],"but":[42,54,71],"struggle":[43],"with":[44,110],"unseen":[45],"types,":[47,202,229],"while":[48,99],"rejection-based":[49,143],"approaches":[50],"can":[51],"mitigate":[52],"misclassification":[53],"fail":[55],"to":[56,77,120,212],"leverage":[57],"unlabeled":[58,118],"data":[59,119],"for":[60,85,184,225],"learning.":[61],"Deep":[62],"learning-based":[63],"methods,":[64,133],"such":[65],"as":[66],"MARS,":[67],"offer":[68],"promising":[69],"solutions":[70],"often":[72,171],"suffer":[73],"from":[74,154],"poor":[75],"generalization":[76],"populations.":[80],"We":[81],"propose":[82],"Semi-supervised":[83],"Robust":[86],"Novel":[87],"Cell-type":[88],"(SRNC),":[90],"semi-supervised":[93,111,192],"framework":[94],"that":[95,168,176],"enhances":[96],"classification":[97,161,186],"accuracy":[98],"effectively":[100,195],"identifying":[101,164],"unknown":[102],"types.":[104],"By":[105,190],"integrating":[106],"self-supervised":[107],"feature":[108],"classification,":[112],"SRNC":[113,129,149,177,194],"leverages":[114],"improve":[121],"generalization.":[122],"Evaluated":[123],"across":[124,152,214],"six":[125],"benchmark":[126],"scRNA-seq":[127,188],"datasets,":[128],"consistently":[130],"outperforms":[131],"state-of-the-art":[132],"achieving":[134],"higher":[135],"ARI,":[136],"F1-score,":[137],"precision":[139,231],"than":[140],"approach":[144,224],"deep-learning-based":[146],"MARS.":[147],"Moreover,":[148],"demonstrates":[150],"robustness":[151],"datasets":[153,215],"different":[155],"laboratories":[156],"excels":[158],"imbalanced":[160],"scenarios,":[162],"rare":[165],"populations":[167],"other":[169],"misclassify.":[172],"Our":[173],"results":[174],"demonstrate":[175],"is":[178],"powerful":[180],"adaptable":[182],"tool":[183],"cell-type":[185],"analysis.":[189],"leveraging":[191],"learning,":[193],"identifies":[196],"surpassing":[203],"competing":[204],"multiple":[207],"performance":[208],"metrics.":[209],"Its":[210],"ability":[211],"generalize":[213],"handle":[217],"class":[218],"imbalances":[219],"makes":[220],"it":[221],"valuable":[223],"discovering":[226],"new":[227],"advancing":[230],"medicine,":[232],"improving":[234],"our":[235],"understanding":[236],"cellular":[238],"heterogeneity.":[239]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-02-01T00:00:00"}
