{"id":"https://openalex.org/W4402068402","doi":"https://doi.org/10.1142/s0219720024500227","title":"SAKit: An all-in-one analysis pipeline for identifying novel proteins resulting from variant events at both large and small scales","display_name":"SAKit: An all-in-one analysis pipeline for identifying novel proteins resulting from variant events at both large and small scales","publication_year":2024,"publication_date":"2024-08-30","ids":{"openalex":"https://openalex.org/W4402068402","doi":"https://doi.org/10.1142/s0219720024500227","pmid":"https://pubmed.ncbi.nlm.nih.gov/39573833"},"language":"en","primary_location":{"id":"doi:10.1142/s0219720024500227","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219720024500227","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100439148","display_name":"Yan Li","orcid":"https://orcid.org/0000-0003-0316-7810"},"institutions":[{"id":"https://openalex.org/I200296433","display_name":"Chinese Academy of Medical Sciences & Peking Union Medical College","ror":"https://ror.org/02drdmm93","country_code":"CN","type":"education","lineage":["https://openalex.org/I200296433"]},{"id":"https://openalex.org/I2801228662","display_name":"Peking Union Medical College Hospital","ror":"https://ror.org/04jztag35","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I2801228662"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yan Li","raw_affiliation_strings":["Department of Breast Surgery, Peking Union Medical College Hospital, Peking Union Medical College, Chinese Academy of Medical Sciences, Beijing 100730, P. R. China"],"raw_orcid":"https://orcid.org/0000-0003-0316-7810","affiliations":[{"raw_affiliation_string":"Department of Breast Surgery, Peking Union Medical College Hospital, Peking Union Medical College, Chinese Academy of Medical Sciences, Beijing 100730, P. R. China","institution_ids":["https://openalex.org/I200296433","https://openalex.org/I2801228662"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Boran Wang","orcid":"https://orcid.org/0009-0005-2879-7212"},"institutions":[{"id":"https://openalex.org/I183519381","display_name":"Capital Medical University","ror":"https://ror.org/013xs5b60","country_code":"CN","type":"education","lineage":["https://openalex.org/I183519381"]},{"id":"https://openalex.org/I4210087691","display_name":"Beijing Tian Tan Hospital","ror":"https://ror.org/003regz62","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210087691"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Boran Wang","raw_affiliation_strings":["Beijing Tiantan Hospital, Capital Medical University, Beijing 100070, P. R. China"],"raw_orcid":"https://orcid.org/0009-0005-2879-7212","affiliations":[{"raw_affiliation_string":"Beijing Tiantan Hospital, Capital Medical University, Beijing 100070, P. R. China","institution_ids":["https://openalex.org/I4210087691","https://openalex.org/I183519381"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021917650","display_name":"Zengding Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zengding Wu","raw_affiliation_strings":["Department of AI and Bioinformatics, Nanjing Chengshi Biopharmaceutical (TheraRNA) Co., Ltd., Nanjing, P. R. China"],"raw_orcid":"https://orcid.org/0009-0004-7989-1164","affiliations":[{"raw_affiliation_string":"Department of AI and Bioinformatics, Nanjing Chengshi Biopharmaceutical (TheraRNA) Co., Ltd., Nanjing, P. R. China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067609757","display_name":"Shiliang Ji","orcid":"https://orcid.org/0000-0002-0393-1324"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiliang Ji","raw_affiliation_strings":["State Key Laboratory of Pharmaceutical Biotechnology, School of Life Sciences, Nanjing University, Nanjing 210023, P. R. China"],"raw_orcid":"https://orcid.org/0000-0002-0393-1324","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Pharmaceutical Biotechnology, School of Life Sciences, Nanjing University, Nanjing 210023, P. R. China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102127167","display_name":"Shi Xu","orcid":"https://orcid.org/0000-0002-8815-9707"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi Xu","raw_affiliation_strings":["Department of AI and Bioinformatics, Nanjing Chengshi Biopharmaceutical (TheraRNA) Co., Ltd., Nanjing, P. R. China"],"raw_orcid":"https://orcid.org/0000-0002-8815-9707","affiliations":[{"raw_affiliation_string":"Department of AI and Bioinformatics, Nanjing Chengshi Biopharmaceutical (TheraRNA) Co., Ltd., Nanjing, P. R. China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070740466","display_name":"Caiyi Fei","orcid":"https://orcid.org/0000-0001-8726-7063"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Caiyi Fei","raw_affiliation_strings":["Department of AI and Bioinformatics, Nanjing Chengshi Biopharmaceutical (TheraRNA) Co., Ltd., Nanjing, P. R. China"],"raw_orcid":"https://orcid.org/0000-0001-8726-7063","affiliations":[{"raw_affiliation_string":"Department of AI and Bioinformatics, Nanjing Chengshi Biopharmaceutical (TheraRNA) Co., Ltd., Nanjing, P. R. China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100439148"],"corresponding_institution_ids":["https://openalex.org/I200296433","https://openalex.org/I2801228662"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12564144,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"22","issue":"05","first_page":"2450022","last_page":"2450022"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6758949756622314},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6127222776412964},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5455611944198608},{"id":"https://openalex.org/keywords/download","display_name":"Download","score":0.4759100079536438},{"id":"https://openalex.org/keywords/library-science","display_name":"Library science","score":0.4132674038410187},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.38899946212768555},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3454105257987976},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10466238856315613}],"concepts":[{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6758949756622314},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6127222776412964},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5455611944198608},{"id":"https://openalex.org/C2780154274","wikidata":"https://www.wikidata.org/wiki/Q7126717","display_name":"Download","level":2,"score":0.4759100079536438},{"id":"https://openalex.org/C161191863","wikidata":"https://www.wikidata.org/wiki/Q199655","display_name":"Library science","level":1,"score":0.4132674038410187},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.38899946212768555},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3454105257987976},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10466238856315613}],"mesh":[{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009154","descriptor_name":"Mutation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009154","descriptor_name":"Mutation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009154","descriptor_name":"Mutation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009154","descriptor_name":"Mutation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014644","descriptor_name":"Genetic Variation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014644","descriptor_name":"Genetic Variation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014644","descriptor_name":"Genetic Variation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014644","descriptor_name":"Genetic Variation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D017423","descriptor_name":"Sequence Analysis, RNA","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D059014","descriptor_name":"High-Throughput Nucleotide Sequencing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D059014","descriptor_name":"High-Throughput Nucleotide Sequencing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D059014","descriptor_name":"High-Throughput Nucleotide Sequencing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D059014","descriptor_name":"High-Throughput Nucleotide Sequencing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1142/s0219720024500227","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219720024500227","pdf_url":null,"source":{"id":"https://openalex.org/S155349577","display_name":"Journal of Bioinformatics and Computational Biology","issn_l":"0219-7200","issn":["0219-7200","1757-6334"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311754","host_organization_name":"Imperial College Press","host_organization_lineage":["https://openalex.org/P4310311754"],"host_organization_lineage_names":["Imperial College Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Bioinformatics and Computational Biology","raw_type":"journal-article"},{"id":"pmid:39573833","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/39573833","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of bioinformatics and computational biology","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6263769471","display_name":null,"funder_award_id":"823B2095","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W44929223","https://openalex.org/W2042228684","https://openalex.org/W2046267726","https://openalex.org/W2083333507","https://openalex.org/W2103148772","https://openalex.org/W2122421045","https://openalex.org/W2137586531","https://openalex.org/W2176982668","https://openalex.org/W2180913304","https://openalex.org/W2190826983","https://openalex.org/W2323851578","https://openalex.org/W2536940559","https://openalex.org/W2543969678","https://openalex.org/W2617020095","https://openalex.org/W2724264513","https://openalex.org/W2771017358","https://openalex.org/W2783811903","https://openalex.org/W2795871670","https://openalex.org/W2797967795","https://openalex.org/W2804476733","https://openalex.org/W2885227878","https://openalex.org/W2885934659","https://openalex.org/W2885985208","https://openalex.org/W2903083041","https://openalex.org/W2904210127","https://openalex.org/W2947377238","https://openalex.org/W2952666313","https://openalex.org/W2958369942","https://openalex.org/W2977786171","https://openalex.org/W2992995309","https://openalex.org/W3091991776","https://openalex.org/W3094017947","https://openalex.org/W3132948359","https://openalex.org/W3190031729","https://openalex.org/W3196875131","https://openalex.org/W3200852171","https://openalex.org/W3213714780","https://openalex.org/W4200282656","https://openalex.org/W4224013007","https://openalex.org/W4283212618","https://openalex.org/W4294675778","https://openalex.org/W4294734216","https://openalex.org/W4298127828","https://openalex.org/W4299701259","https://openalex.org/W4308873556"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2183842793","https://openalex.org/W4255676640","https://openalex.org/W2485259751","https://openalex.org/W4236216870","https://openalex.org/W4243876796","https://openalex.org/W2485273903","https://openalex.org/W2482041988","https://openalex.org/W2489685223","https://openalex.org/W2497349655"],"abstract_inverted_index":{"SAKit":[0,48,72],"is":[1,49],"a":[2,39,60,67],"robust":[3],"and":[4,16,34,46,52,58,76],"versatile":[5],"bioinformatics":[6],"tool":[7],"designed":[8],"for":[9,42,80],"the":[10,23,81],"comprehensive":[11],"identification":[12],"of":[13,25,32,78],"both":[14],"large-scale":[15],"small-scale":[17],"variants":[18],"from":[19],"RNA-seq":[20],"data,":[21,37],"facilitating":[22],"discovery":[24],"novel":[26],"proteins.":[27],"This":[28],"pipeline":[29],"integrates":[30],"analysis":[31],"long-read":[33],"short-read":[35],"sequencing":[36],"offering":[38],"powerful":[40],"solution":[41],"researchers":[43],"in":[44],"genomics":[45],"transcriptomics.":[47],"freely":[50],"accessible":[51],"open-source,":[53],"available":[54],"through":[55],"GitHub":[56],"(https://github.com/therarna/SAKit)":[57],"as":[59],"Docker":[61],"image":[62],"https://hub.docker.com/repository/docker/therarna).":[63],"Implemented":[64],"primarily":[65],"within":[66],"Snakemake":[68],"framework":[69],"using":[70],"Python,":[71],"ensures":[73],"reproducibility,":[74],"scalability,":[75],"ease":[77],"use":[79],"scientific":[82],"community.":[83]},"counts_by_year":[],"updated_date":"2026-04-28T14:05:53.105641","created_date":"2025-10-10T00:00:00"}
