{"id":"https://openalex.org/W4412605485","doi":"https://doi.org/10.1109/tcbbio.2025.3591871","title":"CrisprDA: A Data Augmentation Method Enhancing the Efficiency of sgRNA on-Target Activity Prediction","display_name":"CrisprDA: A Data Augmentation Method Enhancing the Efficiency of sgRNA on-Target Activity Prediction","publication_year":2025,"publication_date":"2025-07-23","ids":{"openalex":"https://openalex.org/W4412605485","doi":"https://doi.org/10.1109/tcbbio.2025.3591871","pmid":"https://pubmed.ncbi.nlm.nih.gov/40811280"},"language":"en","primary_location":{"id":"doi:10.1109/tcbbio.2025.3591871","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbbio.2025.3591871","pdf_url":null,"source":{"id":"https://openalex.org/S5407042751","display_name":"IEEE Transactions on Computational Biology and Bioinformatics","issn_l":"2998-4165","issn":["2998-4165"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009077174","display_name":"Liqiao Chen","orcid":"https://orcid.org/0000-0003-0138-7828"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hao Chen","raw_affiliation_strings":["School of Computer Science and Technology, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062917336","display_name":"Zhenran Jiang","orcid":"https://orcid.org/0000-0002-5275-3632"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenran Jiang","raw_affiliation_strings":["School of Computer Science and Technology, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5009077174"],"corresponding_institution_ids":["https://openalex.org/I66867065"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19641178,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"22","issue":"5","first_page":"2313","last_page":"2319"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10207","display_name":"Advanced biosensing and bioanalysis techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10207","display_name":"Advanced biosensing and bioanalysis techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10725","display_name":"RNA Interference and Gene Delivery","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9728999733924866,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.43619441986083984}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43619441986083984}],"mesh":[{"descriptor_ui":"D000072669","descriptor_name":"Gene Editing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D000072669","descriptor_name":"Gene Editing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D000072669","descriptor_name":"Gene Editing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000094704","descriptor_name":"RNA, Guide, CRISPR-Cas Systems","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D000094704","descriptor_name":"RNA, Guide, CRISPR-Cas Systems","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D000094704","descriptor_name":"RNA, Guide, CRISPR-Cas Systems","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D000094704","descriptor_name":"RNA, Guide, CRISPR-Cas Systems","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D000094704","descriptor_name":"RNA, Guide, CRISPR-Cas Systems","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D000094704","descriptor_name":"RNA, Guide, CRISPR-Cas Systems","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D064113","descriptor_name":"CRISPR-Cas Systems","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D064113","descriptor_name":"CRISPR-Cas Systems","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D064113","descriptor_name":"CRISPR-Cas Systems","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcbbio.2025.3591871","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbbio.2025.3591871","pdf_url":null,"source":{"id":"https://openalex.org/S5407042751","display_name":"IEEE Transactions on Computational Biology and Bioinformatics","issn_l":"2998-4165","issn":["2998-4165"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},{"id":"pmid:40811280","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40811280","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on computational biology and bioinformatics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1903088142","https://openalex.org/W1982846895","https://openalex.org/W1982873976","https://openalex.org/W1988101725","https://openalex.org/W2003171404","https://openalex.org/W2045435533","https://openalex.org/W2096261947","https://openalex.org/W2461013690","https://openalex.org/W2810756255","https://openalex.org/W2902305894","https://openalex.org/W2973312556","https://openalex.org/W2984059576","https://openalex.org/W2999201570","https://openalex.org/W3005962315","https://openalex.org/W3034029360","https://openalex.org/W3039159245","https://openalex.org/W3194399644","https://openalex.org/W4200249739","https://openalex.org/W4220962329","https://openalex.org/W4225646954","https://openalex.org/W4292091702","https://openalex.org/W4293094353","https://openalex.org/W4310276384","https://openalex.org/W4317437864","https://openalex.org/W4385079970","https://openalex.org/W4388979610","https://openalex.org/W4404038467"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"The":[0],"CRISPR/Cas9":[1],"system":[2,17],"has":[3,51],"emerged":[4],"as":[5],"a":[6,76,97,116],"revolutionary":[7],"technology":[8],"in":[9,56,84,170],"genome":[10],"editing,":[11],"yet":[12,78],"the":[13,22,53,67,105,130,160,175,180],"efficiency":[14],"of":[15,25,69,109,133,162,179],"this":[16,63],"is":[18,89],"often":[19],"limited":[20],"by":[21,91],"activity":[23],"level":[24],"single-guide":[26],"RNAs":[27],"(sgRNAs).":[28],"In":[29],"recent":[30],"years,":[31],"deep":[32,70],"learning":[33,71],"models":[34],"have":[35],"been":[36],"increasingly":[37],"utilized":[38],"to":[39,102,166],"predict":[40],"sgRNA":[41,59,134],"targeting":[42],"activity.":[43,60,135],"Notably,":[44],"data":[45,80,182],"scarcity":[46],"rather":[47],"than":[48],"model":[49],"architecture":[50,119],"become":[52],"predominant":[54],"bottleneck":[55],"accurately":[57],"predicting":[58],"To":[61],"overcome":[62],"challenge":[64],"and":[65,107,143,164,177],"enhance":[66],"performance":[68],"models,":[72],"we":[73,113],"propose":[74],"Automix,":[75],"straightforward":[77],"effective":[79],"augmentation":[81,183],"method":[82,88],"grounded":[83],"autoencoder":[85],"technology.":[86],"This":[87],"complemented":[90],"CNLC":[92,165],"(Confidence-based":[93],"Nearest":[94],"Label":[95],"Correction),":[96],"pseudo-label":[98],"correction":[99],"technique":[100],"designed":[101],"improve":[103],"both":[104],"quality":[106],"quantity":[108],"training":[110],"data.":[111],"Additionally,":[112],"develop":[114],"CrisprDA,":[115],"novel":[117],"parallel":[118],"that":[120,148],"integrates":[121],"convolutional":[122],"neural":[123],"networks":[124],"(CNNs)":[125],"with":[126],"attention":[127],"mechanisms,":[128],"for":[129],"precise":[131],"prediction":[132],"Comprehensive":[136],"experiments":[137,172],"conducted":[138],"on":[139],"nine":[140],"high-throughput":[141],"datasets":[142,146],"eight":[144],"functional":[145],"demonstrate":[147],"CrisprDA":[149],"outperforms":[150],"five":[151],"compared":[152],"methods,":[153],"showing":[154],"its":[155],"superior":[156],"predictive":[157],"ability.":[158],"Moreover,":[159],"application":[161],"Automix":[163],"other":[167],"comparative":[168],"methods":[169],"our":[171],"further":[173],"validates":[174],"effectiveness":[176],"generalizability":[178],"proposed":[181],"strategy.":[184]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
