{"id":"https://openalex.org/W4408617735","doi":"https://doi.org/10.1021/acs.jcim.5c00199","title":"CPPCGM: A Highly Efficient Sequence-Based Tool for Simultaneously Identifying and Generating Cell-Penetrating Peptides","display_name":"CPPCGM: A Highly Efficient Sequence-Based Tool for Simultaneously Identifying and Generating Cell-Penetrating Peptides","publication_year":2025,"publication_date":"2025-03-19","ids":{"openalex":"https://openalex.org/W4408617735","doi":"https://doi.org/10.1021/acs.jcim.5c00199","pmid":"https://pubmed.ncbi.nlm.nih.gov/40105337"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.5c00199","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00199","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043775363","display_name":"Qiufen Chen","orcid":"https://orcid.org/0000-0002-8752-571X"},"institutions":[{"id":"https://openalex.org/I4210102541","display_name":"Shenzhen Bay Laboratory","ror":"https://ror.org/00sdcjz77","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210102541"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiufen Chen","raw_affiliation_strings":["Institute of Systems and Physical Biology","Shenzhen Bay Laboratory"],"affiliations":[{"raw_affiliation_string":"Institute of Systems and Physical Biology","institution_ids":[]},{"raw_affiliation_string":"Shenzhen Bay Laboratory","institution_ids":["https://openalex.org/I4210102541"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101975970","display_name":"Yuewei Zhang","orcid":"https://orcid.org/0000-0001-6696-0336"},"institutions":[{"id":"https://openalex.org/I4210102541","display_name":"Shenzhen Bay Laboratory","ror":"https://ror.org/00sdcjz77","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210102541"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuewei Zhang","raw_affiliation_strings":["Institute of Systems and Physical Biology","Shenzhen Bay Laboratory"],"affiliations":[{"raw_affiliation_string":"Institute of Systems and Physical Biology","institution_ids":[]},{"raw_affiliation_string":"Shenzhen Bay Laboratory","institution_ids":["https://openalex.org/I4210102541"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051728653","display_name":"Jiali Gao","orcid":"https://orcid.org/0000-0003-0106-7154"},"institutions":[{"id":"https://openalex.org/I4210102541","display_name":"Shenzhen Bay Laboratory","ror":"https://ror.org/00sdcjz77","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210102541"]},{"id":"https://openalex.org/I4210128628","display_name":"Peking University Shenzhen Hospital","ror":"https://ror.org/03kkjyb15","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210128628"]},{"id":"https://openalex.org/I2800403580","display_name":"University of Minnesota System","ror":"https://ror.org/03grvy078","country_code":"US","type":"education","lineage":["https://openalex.org/I2800403580"]}],"countries":["CN","US"],"is_corresponding":true,"raw_author_name":"Jiali Gao","raw_affiliation_strings":["Department of Chemistry and Supercomputing Institute","Institute of Systems and Physical Biology","Peking University Shenzhen Graduate School","School of Chemical Biology and Biotechnology","Shenzhen Bay Laboratory","University of Minnesota"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Supercomputing Institute","institution_ids":[]},{"raw_affiliation_string":"Institute of Systems and Physical Biology","institution_ids":[]},{"raw_affiliation_string":"Peking University Shenzhen Graduate School","institution_ids":["https://openalex.org/I4210128628"]},{"raw_affiliation_string":"School of Chemical Biology and Biotechnology","institution_ids":[]},{"raw_affiliation_string":"Shenzhen Bay Laboratory","institution_ids":["https://openalex.org/I4210102541"]},{"raw_affiliation_string":"University of Minnesota","institution_ids":["https://openalex.org/I2800403580"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100433085","display_name":"Jun Zhang","orcid":"https://orcid.org/0000-0001-9093-9430"},"institutions":[{"id":"https://openalex.org/I4210102541","display_name":"Shenzhen Bay Laboratory","ror":"https://ror.org/00sdcjz77","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210102541"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jun Zhang","raw_affiliation_strings":["Institute of Systems and Physical Biology","Shenzhen Bay Laboratory"],"affiliations":[{"raw_affiliation_string":"Institute of Systems and Physical Biology","institution_ids":[]},{"raw_affiliation_string":"Shenzhen Bay Laboratory","institution_ids":["https://openalex.org/I4210102541"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5051728653","https://openalex.org/A5100433085"],"corresponding_institution_ids":["https://openalex.org/I2800403580","https://openalex.org/I4210102541","https://openalex.org/I4210128628"],"apc_list":null,"apc_paid":null,"fwci":1.7129,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.8229354,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"65","issue":"7","first_page":"3357","last_page":"3369"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10725","display_name":"RNA Interference and Gene Delivery","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10725","display_name":"RNA Interference and Gene Delivery","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10207","display_name":"Advanced biosensing and bioanalysis techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11103","display_name":"Antimicrobial Peptides and Activities","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/2404","display_name":"Microbiology"},"field":{"id":"https://openalex.org/fields/24","display_name":"Immunology and Microbiology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.6839653849601746},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5366456508636475},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.45101669430732727},{"id":"https://openalex.org/keywords/cell","display_name":"Cell","score":0.4163425862789154},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.3688110113143921},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.3650856614112854},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33255380392074585},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.2067127525806427},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.18394452333450317}],"concepts":[{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.6839653849601746},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5366456508636475},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45101669430732727},{"id":"https://openalex.org/C1491633281","wikidata":"https://www.wikidata.org/wiki/Q7868","display_name":"Cell","level":2,"score":0.4163425862789154},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.3688110113143921},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.3650856614112854},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33255380392074585},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.2067127525806427},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.18394452333450317}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057846","descriptor_name":"Cell-Penetrating Peptides","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D057846","descriptor_name":"Cell-Penetrating Peptides","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.5c00199","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c00199","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:40105337","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40105337","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3300963630","display_name":null,"funder_award_id":"S201101003","funder_id":"https://openalex.org/F4320331248","funder_display_name":"Shenzhen Bay Laboratory"}],"funders":[{"id":"https://openalex.org/F4320331248","display_name":"Shenzhen Bay Laboratory","ror":"https://ror.org/00sdcjz77"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":73,"referenced_works":["https://openalex.org/W1499864241","https://openalex.org/W1515068677","https://openalex.org/W1584683177","https://openalex.org/W1985718949","https://openalex.org/W1986299453","https://openalex.org/W1996461253","https://openalex.org/W2058839892","https://openalex.org/W2068130700","https://openalex.org/W2069182579","https://openalex.org/W2079335891","https://openalex.org/W2081159379","https://openalex.org/W2096023347","https://openalex.org/W2101105183","https://openalex.org/W2102544846","https://openalex.org/W2117692326","https://openalex.org/W2168639488","https://openalex.org/W2220780917","https://openalex.org/W2305144260","https://openalex.org/W2414310543","https://openalex.org/W2573068944","https://openalex.org/W2608969085","https://openalex.org/W2737196618","https://openalex.org/W2766725728","https://openalex.org/W2784083480","https://openalex.org/W2796024961","https://openalex.org/W2807896518","https://openalex.org/W2884031225","https://openalex.org/W2888163308","https://openalex.org/W2891290193","https://openalex.org/W2894167212","https://openalex.org/W2896457183","https://openalex.org/W2897866928","https://openalex.org/W2901179927","https://openalex.org/W2912990441","https://openalex.org/W2914645084","https://openalex.org/W2950793881","https://openalex.org/W2955560891","https://openalex.org/W2960810917","https://openalex.org/W2970597249","https://openalex.org/W2972835519","https://openalex.org/W2987102131","https://openalex.org/W3009631698","https://openalex.org/W3010907323","https://openalex.org/W3027325047","https://openalex.org/W3040739508","https://openalex.org/W3042130878","https://openalex.org/W3104361293","https://openalex.org/W3120503577","https://openalex.org/W3135156311","https://openalex.org/W3143638934","https://openalex.org/W3144701084","https://openalex.org/W3146944767","https://openalex.org/W3154802692","https://openalex.org/W3172444956","https://openalex.org/W3190906682","https://openalex.org/W3195743187","https://openalex.org/W3213557594","https://openalex.org/W4205773061","https://openalex.org/W4206662285","https://openalex.org/W4213270355","https://openalex.org/W4225008496","https://openalex.org/W4285587917","https://openalex.org/W4287824654","https://openalex.org/W4292059000","https://openalex.org/W4298289240","https://openalex.org/W4309148686","https://openalex.org/W4309506674","https://openalex.org/W4312113926","https://openalex.org/W4312126054","https://openalex.org/W4324344300","https://openalex.org/W4382679852","https://openalex.org/W4385245566","https://openalex.org/W4392985130"],"related_works":["https://openalex.org/W2112284452","https://openalex.org/W3188962172","https://openalex.org/W2772917594","https://openalex.org/W4312825515","https://openalex.org/W4306742369","https://openalex.org/W4303457083","https://openalex.org/W2131146434","https://openalex.org/W3085798047","https://openalex.org/W2951359407","https://openalex.org/W2374269412"],"abstract_inverted_index":{"Cell-penetrating":[0],"peptides":[1,148,220],"(CPPs)":[2],"are":[3,108,150,232],"usually":[4],"short":[5],"oligopeptides":[6],"with":[7,184],"5-30":[8],"amino":[9],"acid":[10],"residues.":[11],"CPPs":[12,38,130],"have":[13,47],"been":[14,48],"proven":[15],"as":[16,29,54],"important":[17],"drug":[18,225],"delivery":[19,226],"vehicles":[20],"into":[21],"cells":[22],"through":[23,205],"different":[24],"mechanisms,":[25],"demonstrating":[26],"their":[27],"potential":[28,63,79,202],"therapeutic":[30],"candidates.":[31,65],"However,":[32],"experimental":[33],"screening":[34,59],"and":[35,42,103,116,131,144,172,207,227],"synthesis":[36],"of":[37,62,169,190,203,210],"could":[39],"be":[40],"time-consuming":[41],"expensive.":[43],"Recently,":[44],"numerous":[45],"attempts":[46],"made":[49],"to":[50,101,136],"develop":[51],"computational":[52],"methods":[53,70,217],"a":[55,60,89,137,142,145],"cost-effective":[56],"way":[57],"for":[58,80,124,221],"number":[61],"CPP":[64],"Despite":[66],"significant":[67],"advancements,":[68],"current":[69],"exhibit":[71],"limited":[72],"feature":[73],"representation":[74],"capabilities,":[75],"thereby":[76,127],"constraining":[77],"the":[78,154,180,185,188,200,211],"further":[81],"performance":[82,189],"enhancements.":[83],"In":[84],"this":[85,113],"study,":[86],"we":[87],"developed":[88],"deep":[90],"learning":[91],"framework":[92],"called":[93],"CPPCGM,":[94],"which":[95],"uses":[96],"protein":[97],"language":[98],"models":[99,123],"(PLMs)":[100],"identify":[102],"generate":[104],"novel":[105],"CPPs.":[106],"There":[107],"two":[109],"separate":[110],"blocks":[111],"in":[112,153],"framework:":[114],"CPPClassifier":[115],"CPPGenerator.":[117],"The":[118,133,196],"former":[119],"utilizes":[120],"three":[121,175],"pretrained":[122],"simple":[125],"voting,":[126],"accurately":[128],"categorizing":[129],"non-CPPs.":[132],"latter,":[134],"similar":[135],"generative":[138],"adversarial":[139],"network,":[140],"including":[141],"discriminator":[143],"generator,":[146],"generates":[147],"that":[149],"not":[151],"present":[152],"training":[155],"data":[156,176],"set.":[157],"Our":[158],"proposed":[159],"CPPCGM":[160,204],"has":[161],"achieved":[162],"remarkably":[163],"high":[164],"Matthews":[165],"correlation":[166],"coefficient":[167],"scores":[168],"0.876,":[170],"0.923,":[171],"0.664":[173],"on":[174,179],"sets":[177],"based":[178],"classification":[181],"results.":[182],"Compared":[183],"state-of-the-art":[186],"methods,":[187],"our":[191],"method":[192],"is":[193],"significantly":[194],"improved.":[195],"results":[197],"also":[198],"demonstrated":[199],"generating":[201],"qualitative":[206],"quantitative":[208],"evaluation":[209],"generated":[212],"samples.":[213],"Significantly,":[214],"using":[215],"PLM-based":[216],"can":[218],"optimize":[219],"biochemical":[222],"functions,":[223],"benefiting":[224],"biomedical":[228],"applications.":[229],"Materials":[230],"related":[231],"publicly":[233],"available":[234],"at":[235],"https://github.com/QiufenChen/CPPCGM.":[236]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
