{"id":"https://openalex.org/W4416978910","doi":"https://doi.org/10.1021/acs.jcim.5c02437","title":"ProSECFPs: A Novel Fingerprint-Based Protein Representation Method for Missense Mutation Pathogenicity Prediction","display_name":"ProSECFPs: A Novel Fingerprint-Based Protein Representation Method for Missense Mutation Pathogenicity Prediction","publication_year":2025,"publication_date":"2025-12-04","ids":{"openalex":"https://openalex.org/W4416978910","doi":"https://doi.org/10.1021/acs.jcim.5c02437","pmid":"https://pubmed.ncbi.nlm.nih.gov/41340413"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.5c02437","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c02437","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116466702","display_name":"Clarissa Poles","orcid":null},"institutions":[{"id":"https://openalex.org/I4210149489","display_name":"Scuola Superiore Meridionale","ror":"https://ror.org/04swxte59","country_code":"IT","type":"education","lineage":["https://openalex.org/I4210149489"]},{"id":"https://openalex.org/I4210152213","display_name":"Telethon Institute Of Genetics And Medicine","ror":"https://ror.org/04xfdsg27","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210152213"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Clarissa Poles","raw_affiliation_strings":["Genomics and Experimental Medicine Program, Scuola Superiore Meridionale (SSM, School of Advanced Studies), Via Mezzocannone 4, 80078 Napoli, Italy","Telethon Institute of Genetics and Medicine, Via Campi Flegrei 34, 80078 Napoli, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Genomics and Experimental Medicine Program, Scuola Superiore Meridionale (SSM, School of Advanced Studies), Via Mezzocannone 4, 80078 Napoli, Italy","institution_ids":["https://openalex.org/I4210149489"]},{"raw_affiliation_string":"Telethon Institute of Genetics and Medicine, Via Campi Flegrei 34, 80078 Napoli, Italy","institution_ids":["https://openalex.org/I4210152213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063076795","display_name":"Miriana Di Stefano","orcid":"https://orcid.org/0000-0001-6727-5816"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Miriana Di Stefano","raw_affiliation_strings":["Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy"],"raw_orcid":"https://orcid.org/0000-0001-6727-5816","affiliations":[{"raw_affiliation_string":"Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103038719","display_name":"Lisa Piazza","orcid":"https://orcid.org/0009-0007-5062-4590"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Lisa Piazza","raw_affiliation_strings":["Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy"],"raw_orcid":"https://orcid.org/0009-0007-5062-4590","affiliations":[{"raw_affiliation_string":"Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038293326","display_name":"Giulia Bononi","orcid":"https://orcid.org/0000-0002-4336-4344"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giulia Bononi","raw_affiliation_strings":["Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy"],"raw_orcid":"https://orcid.org/0000-0002-4336-4344","affiliations":[{"raw_affiliation_string":"Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042899314","display_name":"Giulio Poli","orcid":"https://orcid.org/0000-0002-8061-5632"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giulio Poli","raw_affiliation_strings":["Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy"],"raw_orcid":"https://orcid.org/0000-0002-8061-5632","affiliations":[{"raw_affiliation_string":"Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054823471","display_name":"Marco Macchia","orcid":"https://orcid.org/0000-0002-5565-2044"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Macchia","raw_affiliation_strings":["Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tiziano Tuccinardi","orcid":"https://orcid.org/0000-0002-6205-4069"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]},{"id":"https://openalex.org/I2801004183","display_name":"Temple College","ror":"https://ror.org/038s1ax16","country_code":"US","type":"education","lineage":["https://openalex.org/I2801004183"]},{"id":"https://openalex.org/I84392919","display_name":"Temple University","ror":"https://ror.org/00kx1jb78","country_code":"US","type":"education","lineage":["https://openalex.org/I84392919"]}],"countries":["IT","US"],"is_corresponding":true,"raw_author_name":"Tiziano Tuccinardi","raw_affiliation_strings":["Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology","Temple University","Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology, Temple University, Philadelphia, Pennsylvania 19122, United States"],"raw_orcid":"https://orcid.org/0000-0002-6205-4069","affiliations":[{"raw_affiliation_string":"Department of Pharmacy, University of Pisa, Via Bonanno 6, 56126 Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]},{"raw_affiliation_string":"Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology","institution_ids":[]},{"raw_affiliation_string":"Temple University","institution_ids":["https://openalex.org/I2801004183","https://openalex.org/I84392919"]},{"raw_affiliation_string":"Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology, Temple University, Philadelphia, Pennsylvania 19122, United States","institution_ids":["https://openalex.org/I84392919"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024798356","display_name":"Antonio Giordano","orcid":"https://orcid.org/0000-0002-5959-016X"},"institutions":[{"id":"https://openalex.org/I2801004183","display_name":"Temple College","ror":"https://ror.org/038s1ax16","country_code":"US","type":"education","lineage":["https://openalex.org/I2801004183"]},{"id":"https://openalex.org/I84392919","display_name":"Temple University","ror":"https://ror.org/00kx1jb78","country_code":"US","type":"education","lineage":["https://openalex.org/I84392919"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Antonio Giordano","raw_affiliation_strings":["Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology","Temple University","Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology, Temple University, Philadelphia, Pennsylvania 19122, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology","institution_ids":[]},{"raw_affiliation_string":"Temple University","institution_ids":["https://openalex.org/I2801004183","https://openalex.org/I84392919"]},{"raw_affiliation_string":"Sbarro Institute for Cancer Research and Molecular Medicine, Center for Biotechnology, College of Science and Technology, Temple University, Philadelphia, Pennsylvania 19122, United States","institution_ids":["https://openalex.org/I84392919"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I108290504","https://openalex.org/I2801004183","https://openalex.org/I84392919"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.31687327,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"65","issue":"24","first_page":"13478","last_page":"13492"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.7572000026702881,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.7572000026702881,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.1534000039100647,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.02419999986886978,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/missense-mutation","display_name":"Missense mutation","score":0.6901000142097473},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.6060000061988831},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5342000126838684},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.522599995136261},{"id":"https://openalex.org/keywords/pathogenicity","display_name":"Pathogenicity","score":0.5090000033378601},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4535999894142151},{"id":"https://openalex.org/keywords/cheminformatics","display_name":"Cheminformatics","score":0.4528000056743622},{"id":"https://openalex.org/keywords/pseudo-amino-acid-composition","display_name":"Pseudo amino acid composition","score":0.3977999985218048},{"id":"https://openalex.org/keywords/mutation","display_name":"Mutation","score":0.39340001344680786},{"id":"https://openalex.org/keywords/protein-structure-prediction","display_name":"Protein structure prediction","score":0.3695000112056732}],"concepts":[{"id":"https://openalex.org/C75563809","wikidata":"https://www.wikidata.org/wiki/Q2656896","display_name":"Missense mutation","level":4,"score":0.6901000142097473},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.6060000061988831},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5922999978065491},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5907999873161316},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5342000126838684},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5293999910354614},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.522599995136261},{"id":"https://openalex.org/C64502627","wikidata":"https://www.wikidata.org/wiki/Q170065","display_name":"Pathogenicity","level":2,"score":0.5090000033378601},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4702000021934509},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4535999894142151},{"id":"https://openalex.org/C68762167","wikidata":"https://www.wikidata.org/wiki/Q910164","display_name":"Cheminformatics","level":2,"score":0.4528000056743622},{"id":"https://openalex.org/C2780362125","wikidata":"https://www.wikidata.org/wiki/Q7254464","display_name":"Pseudo amino acid composition","level":4,"score":0.3977999985218048},{"id":"https://openalex.org/C501734568","wikidata":"https://www.wikidata.org/wiki/Q42918","display_name":"Mutation","level":3,"score":0.39340001344680786},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.3806000053882599},{"id":"https://openalex.org/C18051474","wikidata":"https://www.wikidata.org/wiki/Q899656","display_name":"Protein structure prediction","level":3,"score":0.3695000112056732},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.36820000410079956},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.3546000123023987},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C152769699","wikidata":"https://www.wikidata.org/wiki/Q410814","display_name":"Protein design","level":3,"score":0.32269999384880066},{"id":"https://openalex.org/C111364199","wikidata":"https://www.wikidata.org/wiki/Q2915896","display_name":"Protein methods","level":4,"score":0.3149000108242035},{"id":"https://openalex.org/C11804247","wikidata":"https://www.wikidata.org/wiki/Q896177","display_name":"Protein\u2013protein interaction","level":2,"score":0.30399999022483826},{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.3034000098705292},{"id":"https://openalex.org/C144292202","wikidata":"https://www.wikidata.org/wiki/Q898273","display_name":"Protein domain","level":3,"score":0.288100004196167},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.2870999872684479},{"id":"https://openalex.org/C171897839","wikidata":"https://www.wikidata.org/wiki/Q417841","display_name":"Protein family","level":3,"score":0.2773999869823456},{"id":"https://openalex.org/C207060522","wikidata":"https://www.wikidata.org/wiki/Q7251473","display_name":"Protein function prediction","level":4,"score":0.27619999647140503},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.27230000495910645},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.2671000063419342},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C51679486","wikidata":"https://www.wikidata.org/wiki/Q380546","display_name":"DNA sequencing","level":3,"score":0.26409998536109924},{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.26409998536109924},{"id":"https://openalex.org/C2986374874","wikidata":"https://www.wikidata.org/wiki/Q8054","display_name":"Protein function","level":3,"score":0.2578999996185303},{"id":"https://openalex.org/C178180057","wikidata":"https://www.wikidata.org/wiki/Q7251477","display_name":"Protein superfamily","level":3,"score":0.2549000084400177},{"id":"https://openalex.org/C61053724","wikidata":"https://www.wikidata.org/wiki/Q1154615","display_name":"Sequence analysis","level":3,"score":0.2515999972820282}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D020125","descriptor_name":"Mutation, Missense","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020125","descriptor_name":"Mutation, Missense","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1021/acs.jcim.5c02437","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c02437","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:41340413","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41340413","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:arpi.unipi.it:11568/1355967","is_oa":false,"landing_page_url":"https://hdl.handle.net/11568/1355967","pdf_url":null,"source":{"id":"https://openalex.org/S4377196265","display_name":"CINECA IRIS Institutial research information system (University of Pisa)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I108290504","host_organization_name":"University of Pisa","host_organization_lineage":["https://openalex.org/I108290504"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6415171107","display_name":null,"funder_award_id":"CUP I53C22000780001","funder_id":"https://openalex.org/F4320321873","funder_display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca"},{"id":"https://openalex.org/G7644367572","display_name":null,"funder_award_id":"PNRR ECS00000017","funder_id":"https://openalex.org/F7311471023","funder_display_name":"NextGenerationEU"}],"funders":[{"id":"https://openalex.org/F4320321873","display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","ror":"https://ror.org/0166hxq48"},{"id":"https://openalex.org/F7311471023","display_name":"NextGenerationEU","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W14024944","https://openalex.org/W1496604422","https://openalex.org/W1563940013","https://openalex.org/W1564121197","https://openalex.org/W1985505753","https://openalex.org/W1988037271","https://openalex.org/W2024213882","https://openalex.org/W2025580327","https://openalex.org/W2036350498","https://openalex.org/W2038059723","https://openalex.org/W2040870580","https://openalex.org/W2042084565","https://openalex.org/W2043338013","https://openalex.org/W2047672715","https://openalex.org/W2056132907","https://openalex.org/W2075006095","https://openalex.org/W2077450748","https://openalex.org/W2132292391","https://openalex.org/W2143238378","https://openalex.org/W2145957695","https://openalex.org/W2160979370","https://openalex.org/W2174602966","https://openalex.org/W2342603028","https://openalex.org/W2521967673","https://openalex.org/W2889677957","https://openalex.org/W2911839817","https://openalex.org/W2911964244","https://openalex.org/W2952209472","https://openalex.org/W2999309192","https://openalex.org/W3025885307","https://openalex.org/W3035302862","https://openalex.org/W3114444973","https://openalex.org/W3136918052","https://openalex.org/W3177828909","https://openalex.org/W3195375135","https://openalex.org/W3209435229","https://openalex.org/W3211291051","https://openalex.org/W4206002704","https://openalex.org/W4223644783","https://openalex.org/W4285594705","https://openalex.org/W4296002892","https://openalex.org/W4310332067","https://openalex.org/W4313531466","https://openalex.org/W4323309784","https://openalex.org/W4327550249","https://openalex.org/W4385563495","https://openalex.org/W4386508152","https://openalex.org/W4386624928","https://openalex.org/W4387348861","https://openalex.org/W4388523068","https://openalex.org/W4389174567","https://openalex.org/W4389453216","https://openalex.org/W4389472984","https://openalex.org/W4403265049","https://openalex.org/W4405988325","https://openalex.org/W4411388612","https://openalex.org/W4412426792","https://openalex.org/W4414340177"],"related_works":[],"abstract_inverted_index":{"Developing":[0],"effective":[1],"computational":[2,14,156],"representations":[3,19],"of":[4,13,82,92,100,158],"protein":[5,74,127,173],"sequences":[6],"is":[7],"crucial":[8],"for":[9,165],"advancing":[10],"diverse":[11,98],"areas":[12],"biology":[15],"and":[16,29,69,80,104,143,153,172],"bioinformatics.":[17],"Ideal":[18],"must":[20],"be":[21],"computationally":[22],"efficient,":[23],"scalable,":[24],"informative,":[25],"flexible":[26],"across":[27],"contexts,":[28],"broadly":[30],"applicable.":[31],"To":[32],"address":[33],"these":[34],"requirements,":[35],"we":[36],"propose":[37],"Protein":[38],"Sequence":[39],"Extended-Connectivity":[40,49],"Fingerprints":[41,50],"(ProSECFPs),":[42],"a":[43,97,150,162],"novel":[44],"fingerprinting":[45],"method":[46],"inspired":[47],"by":[48,84,95],"(ECFPs),":[51],"commonly":[52],"used":[53],"in":[54,88,169],"chemoinformatics":[55],"to":[56,73,137],"represent":[57],"small":[58],"molecules.":[59],"ProSECFPs":[60,83,147],"effectively":[61],"capture":[62],"the":[63,78,90],"complex":[64],"physicochemical":[65],"characteristics,":[66],"sequence-specific":[67],"details,":[68],"structural":[70],"attributes":[71],"intrinsic":[72],"sequences.":[75],"We":[76],"demonstrate":[77],"effectiveness":[79],"versatility":[81],"evaluating":[85],"their":[86,116,135],"performance":[87,132],"predicting":[89],"pathogenicity":[91],"missense":[93],"mutations":[94],"applying":[96],"set":[99],"machine":[101],"learning":[102,106],"(ML)":[103],"deep":[105],"(DL)":[107],"algorithms.":[108],"Notably,":[109],"our":[110],"results":[111],"indicate":[112],"that":[113],"ProSECFPs,":[114],"especially":[115],"frequency-aware":[117],"variants,":[118],"achieve":[119],"competitive":[120],"or":[121],"superior":[122],"accuracy":[123],"compared":[124],"with":[125],"established":[126],"sequence":[128,145],"descriptors.":[129],"This":[130],"enhanced":[131],"arises":[133],"from":[134],"ability":[136],"comprehensively":[138],"integrate":[139],"amino":[140],"acid":[141],"composition":[142],"detailed":[144],"information.":[146],"thus":[148],"provide":[149],"robust,":[151],"adaptable,":[152],"highly":[154],"informative":[155],"representation":[157],"proteins,":[159],"serving":[160],"as":[161],"powerful":[163],"foundation":[164],"addressing":[166],"interdisciplinary":[167],"challenges":[168],"bioinformatics,":[170],"genomics,":[171],"engineering.":[174]},"counts_by_year":[],"updated_date":"2026-05-10T08:33:47.465468","created_date":"2025-12-04T00:00:00"}
