{"id":"https://openalex.org/W4416286408","doi":"https://doi.org/10.1109/tcbbio.2025.3633384","title":"GTLSTMEP: A Novel Model Based on Graph Transformer and bi-LSTM for Predicting Essential Proteins in Sampled Subgraphs","display_name":"GTLSTMEP: A Novel Model Based on Graph Transformer and bi-LSTM for Predicting Essential Proteins in Sampled Subgraphs","publication_year":2025,"publication_date":"2025-11-17","ids":{"openalex":"https://openalex.org/W4416286408","doi":"https://doi.org/10.1109/tcbbio.2025.3633384","pmid":"https://pubmed.ncbi.nlm.nih.gov/41247900"},"language":"en","primary_location":{"id":"doi:10.1109/tcbbio.2025.3633384","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbbio.2025.3633384","pdf_url":null,"source":{"id":"https://openalex.org/S5407042751","display_name":"IEEE Transactions on Computational Biology and Bioinformatics","issn_l":"2998-4165","issn":["2998-4165"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100698809","display_name":"He Zhao","orcid":"https://orcid.org/0000-0002-3988-2851"},"institutions":[{"id":"https://openalex.org/I194450716","display_name":"Jilin University","ror":"https://ror.org/00js3aw79","country_code":"CN","type":"education","lineage":["https://openalex.org/I194450716"]},{"id":"https://openalex.org/I4210134929","display_name":"Jilin Province Science and Technology Department","ror":"https://ror.org/049x38272","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210134929"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"He Zhao","raw_affiliation_strings":["School of Computer Science and Technology, Jilin University, Changchun, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Jilin University, Changchun, China","institution_ids":["https://openalex.org/I4210134929","https://openalex.org/I194450716"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100453381","display_name":"Tao Wang","orcid":"https://orcid.org/0000-0001-5004-160X"},"institutions":[{"id":"https://openalex.org/I194450716","display_name":"Jilin University","ror":"https://ror.org/00js3aw79","country_code":"CN","type":"education","lineage":["https://openalex.org/I194450716"]},{"id":"https://openalex.org/I4210134929","display_name":"Jilin Province Science and Technology Department","ror":"https://ror.org/049x38272","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210134929"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Wang","raw_affiliation_strings":["School of Computer Science and Technology, Jilin University, Changchun, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Jilin University, Changchun, China","institution_ids":["https://openalex.org/I4210134929","https://openalex.org/I194450716"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075740101","display_name":"Huan Xu","orcid":"https://orcid.org/0000-0002-4075-3846"},"institutions":[{"id":"https://openalex.org/I194450716","display_name":"Jilin University","ror":"https://ror.org/00js3aw79","country_code":"CN","type":"education","lineage":["https://openalex.org/I194450716"]},{"id":"https://openalex.org/I4210134929","display_name":"Jilin Province Science and Technology Department","ror":"https://ror.org/049x38272","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210134929"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huan Xu","raw_affiliation_strings":["School of Computer Science and Technology, Jilin University, Changchun, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Jilin University, Changchun, China","institution_ids":["https://openalex.org/I4210134929","https://openalex.org/I194450716"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113156748","display_name":"Guixia Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I194450716","display_name":"Jilin University","ror":"https://ror.org/00js3aw79","country_code":"CN","type":"education","lineage":["https://openalex.org/I194450716"]},{"id":"https://openalex.org/I4210134929","display_name":"Jilin Province Science and Technology Department","ror":"https://ror.org/049x38272","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210134929"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guixia Liu","raw_affiliation_strings":["School of Computer Science and Technology, Jilin University, Changchun, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Jilin University, Changchun, China","institution_ids":["https://openalex.org/I4210134929","https://openalex.org/I194450716"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100698809"],"corresponding_institution_ids":["https://openalex.org/I194450716","https://openalex.org/I4210134929"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.30932881,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"23","issue":"1","first_page":"39","last_page":"52"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9316999912261963,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9316999912261963,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.01720000058412552,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.007300000172108412,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5113000273704529},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.44040000438690186},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.3833000063896179},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.38190001249313354},{"id":"https://openalex.org/keywords/perceptron","display_name":"Perceptron","score":0.3700999915599823},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.3628999888896942},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.3628000020980835},{"id":"https://openalex.org/keywords/laplacian-matrix","display_name":"Laplacian matrix","score":0.3619999885559082}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6040999889373779},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5113000273704529},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.44040000438690186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43149998784065247},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.3833000063896179},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.38190001249313354},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.3700999915599823},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.3628999888896942},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3628000020980835},{"id":"https://openalex.org/C115178988","wikidata":"https://www.wikidata.org/wiki/Q772067","display_name":"Laplacian matrix","level":3,"score":0.3619999885559082},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36149999499320984},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.3571000099182129},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34380000829696655},{"id":"https://openalex.org/C28225019","wikidata":"https://www.wikidata.org/wiki/Q4915005","display_name":"Biological network","level":2,"score":0.3434999883174896},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33480000495910645},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.329800009727478},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.29899999499320984},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29249998927116394},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C100595998","wikidata":"https://www.wikidata.org/wiki/Q11731931","display_name":"Graph kernel","level":5,"score":0.2535000145435333},{"id":"https://openalex.org/C140051345","wikidata":"https://www.wikidata.org/wiki/Q7251501","display_name":"Protein subcellular localization prediction","level":3,"score":0.25130000710487366}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcbbio.2025.3633384","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbbio.2025.3633384","pdf_url":null,"source":{"id":"https://openalex.org/S5407042751","display_name":"IEEE Transactions on Computational Biology and Bioinformatics","issn_l":"2998-4165","issn":["2998-4165"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},{"id":"pmid:41247900","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41247900","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on computational biology and bioinformatics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1973758399","https://openalex.org/W2005708641","https://openalex.org/W2007245700","https://openalex.org/W2036799174","https://openalex.org/W2079735306","https://openalex.org/W2080124756","https://openalex.org/W2088590769","https://openalex.org/W2089125183","https://openalex.org/W2100371004","https://openalex.org/W2115746733","https://openalex.org/W2124354935","https://openalex.org/W2132582966","https://openalex.org/W2146447390","https://openalex.org/W2148043260","https://openalex.org/W2151296292","https://openalex.org/W2162891889","https://openalex.org/W2340802671","https://openalex.org/W2586452838","https://openalex.org/W2790765877","https://openalex.org/W2911115880","https://openalex.org/W2911569307","https://openalex.org/W2912802963","https://openalex.org/W2915554882","https://openalex.org/W2915975108","https://openalex.org/W2962756421","https://openalex.org/W2991321419","https://openalex.org/W3008459824","https://openalex.org/W3037025616","https://openalex.org/W3037436972","https://openalex.org/W3177371828","https://openalex.org/W3216491494","https://openalex.org/W4289766530","https://openalex.org/W4310594072","https://openalex.org/W4319309781","https://openalex.org/W4366694841","https://openalex.org/W4377011355","https://openalex.org/W4389196583","https://openalex.org/W4392952638","https://openalex.org/W4399447258"],"related_works":[],"abstract_inverted_index":{"Predicting":[0],"essential":[1,150],"proteins":[2],"is":[3,81,173],"crucial":[4],"for":[5,149],"identifying":[6],"disease-causing":[7],"genes":[8],"and":[9,32,53,67,73,107],"advancing":[10],"drug":[11],"discovery.":[12],"However,":[13],"existing":[14],"methods":[15],"face":[16],"challenges,":[17],"such":[18],"as":[19],"insufficient":[20],"capture":[21],"of":[22,29,35,130,186,189],"biological":[23,61],"properties,":[24],"class":[25,85],"imbalance,":[26],"incomplete":[27],"representation":[28],"network":[30],"topology,":[31],"inadequate":[33],"utilization":[34],"edge":[36,74,122],"features.":[37,75],"To":[38],"address":[39],"these":[40,138],"limitations,":[41],"we":[42],"propose":[43],"a":[44,145],"novel":[45],"model,":[46],"GTLSTMEP,":[47],"which":[48],"combines":[49],"Graph":[50],"Transformer":[51],"(GT)":[52],"Bidirectional":[54],"Long":[55],"Short-Term":[56],"Memory":[57],"(bi-LSTM).":[58],"GTLSTMEP":[59,157,168],"leverages":[60],"data-including":[62],"subcellular":[63],"localization,":[64],"protein":[65,131,151],"complexes,":[66],"gene":[68,92],"expression":[69,93],"profiles-to":[70],"initialize":[71],"node":[72,134],"A":[76],"subgraph":[77],"batch":[78],"sampling":[79],"approach":[80],"employed":[82],"to":[83,126],"handle":[84],"imbalance.":[86],"The":[87,133],"bi-LSTM":[88],"module":[89,98],"processes":[90],"time-series":[91],"data,":[94],"while":[95],"the":[96,128,165,177,184],"GT":[97],"captures":[99],"global":[100],"topological":[101,109],"features":[102,110,123,135],"using":[103],"Laplacian":[104],"positional":[105],"encodings":[106],"local":[108],"through":[111],"an":[112,170],"attention":[113],"mechanism":[114],"that":[115,156,172],"automatically":[116],"identifies":[117],"neighboring":[118],"nodes'":[119],"characteristics.":[120],"Additionally,":[121],"are":[124,141],"integrated":[125],"enhance":[127],"learning":[129],"interactions.":[132],"extracted":[136],"from":[137],"two":[139],"modules":[140],"then":[142],"fed":[143],"into":[144],"Multi-Layer":[146],"Perceptron":[147],"(MLP)":[148],"prediction.":[152],"Experimental":[153],"results":[154],"demonstrate":[155],"outperforms":[158],"all":[159],"comparative":[160],"methods.":[161],"For":[162],"instance,":[163],"on":[164],"DIP":[166],"dataset,":[167],"achieves":[169],"$AUC$":[171],"17.64%":[174],"higher":[175],"than":[176],"next-best":[178],"model.":[179],"Ablation":[180],"studies":[181],"further":[182],"confirm":[183],"effectiveness":[185],"each":[187],"component":[188],"GTLSTMEP.":[190]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-11-17T00:00:00"}
