{"id":"https://openalex.org/W7126057104","doi":"https://doi.org/10.1109/bibm66473.2025.11356802","title":"ProtAgent-ESM2: an Efficient Framework for Long Protein Sequences Modeling in Protein-Protein Interaction Prediction","display_name":"ProtAgent-ESM2: an Efficient Framework for Long Protein Sequences Modeling in Protein-Protein Interaction Prediction","publication_year":2025,"publication_date":"2025-12-15","ids":{"openalex":"https://openalex.org/W7126057104","doi":"https://doi.org/10.1109/bibm66473.2025.11356802"},"language":null,"primary_location":{"id":"doi:10.1109/bibm66473.2025.11356802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356802","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100446035","display_name":"Hao Wang","orcid":"https://orcid.org/0000-0001-6881-9977"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Huaiyuan Wang","raw_affiliation_strings":["College of Computer Science and Software Engineering, Shenzhen University,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Shenzhen University,Shenzhen,China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059502458","display_name":"Changkun Jiang","orcid":"https://orcid.org/0000-0003-2772-2348"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changkun Jiang","raw_affiliation_strings":["College of Computer Science and Software Engineering, Shenzhen University,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Software Engineering, Shenzhen University,Shenzhen,China","institution_ids":["https://openalex.org/I180726961"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100446035"],"corresponding_institution_ids":["https://openalex.org/I180726961"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.67326638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"196","last_page":"201"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.5289000272750854,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.5289000272750854,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.2143000066280365,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.06920000165700912,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5993000268936157},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.551800012588501},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5127000212669373},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.48030000925064087},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.46880000829696655},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.41839998960494995},{"id":"https://openalex.org/keywords/computational-model","display_name":"Computational model","score":0.3912999927997589}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7039999961853027},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5993000268936157},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.551800012588501},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5127000212669373},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.48030000925064087},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.41839998960494995},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41510000824928284},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.3912999927997589},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.3772999942302704},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3508000075817108},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3366999924182892},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.3260999917984009},{"id":"https://openalex.org/C70710897","wikidata":"https://www.wikidata.org/wiki/Q680081","display_name":"Separable space","level":2,"score":0.32440000772476196},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.3077000081539154},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30160000920295715},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29809999465942383},{"id":"https://openalex.org/C81845259","wikidata":"https://www.wikidata.org/wiki/Q290117","display_name":"Quadratic programming","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.25060001015663147}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm66473.2025.11356802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356802","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1982267716","https://openalex.org/W2008840001","https://openalex.org/W2152705149","https://openalex.org/W2162392441","https://openalex.org/W2890911678","https://openalex.org/W2957436444","https://openalex.org/W3177500196","https://openalex.org/W4200461926","https://openalex.org/W4226343290","https://openalex.org/W4327550249","https://openalex.org/W4353066697","https://openalex.org/W4388464011","https://openalex.org/W4388979610","https://openalex.org/W4392500220","https://openalex.org/W4400984795","https://openalex.org/W4401455507","https://openalex.org/W4403944333","https://openalex.org/W4405099223","https://openalex.org/W4406811692","https://openalex.org/W4412454121","https://openalex.org/W4413950477"],"related_works":[],"abstract_inverted_index":{"Existing":[0],"sequence-based":[1],"protein-protein":[2],"interaction":[3],"(PPI)":[4],"prediction":[5],"methods":[6],"face":[7],"a":[8,38,47,100,120],"critical":[9],"bottleneck:":[10],"the":[11,53,152],"quadratic":[12,74],"computational":[13,71,155],"complexity":[14,72],"of":[15],"standard":[16,141],"Transformer":[17],"attention":[18,60],"mechanisms":[19],"often":[20],"necessitates":[21],"models":[22],"to":[23,28,75,125],"truncate":[24],"protein":[25,130],"sequences,":[26],"leading":[27],"information":[29],"loss":[30],"and":[31,99],"performance":[32,127,139,146],"limitations.":[33],"This":[34],"paper":[35],"introduces":[36],"ProtAgent-ESM2,":[37],"novel":[39],"framework":[40,57],"that":[41,104,135],"overcomes":[42],"this":[43],"limitation":[44],"by":[45],"integrating":[46],"protein-specific":[48,85],"Agent":[49],"Attention":[50],"mechanism":[51],"into":[52,62],"ESM-2":[54,107],"backbone.":[55],"Our":[56],"decomposes":[58],"dense":[59],"interactions":[61],"two":[63],"sparse":[64],"stages":[65],"through":[66,95],"learnable":[67],"agent":[68],"tokens,":[69],"reducing":[70],"from":[73],"near-linear":[76],"while":[77,143],"maintaining":[78,144],"global":[79],"context":[80],"modeling":[81,94],"capabilities.":[82],"We":[83],"implement":[84],"adaptations,":[86],"including":[87],"asymmetric":[88],"rotary":[89],"position":[90],"embeddings,":[91],"local":[92],"structure":[93],"depthwise":[96],"separable":[97],"convolutions,":[98],"hybrid":[101],"embedding":[102],"strategy":[103],"combines":[105],"static":[106],"representations":[108],"with":[109],"dynamic":[110],"task-specific":[111],"features.":[112],"To":[113],"validate":[114],"our":[115],"framework,":[116],"we":[117],"construct":[118],"Intra-2-Long,":[119],"challenging":[121],"benchmark":[122],"specifically":[123],"designed":[124],"evaluate":[126],"on":[128,140],"long":[129],"sequences.":[131],"Experimental":[132],"results":[133],"demonstrate":[134],"ProtAgent-ESM2":[136],"achieves":[137],"competitive":[138],"benchmarks":[142],"consistent":[145],"across":[147],"varying":[148],"sequence":[149],"lengths,":[150],"advancing":[151],"state-of-the-art":[153],"in":[154],"PPI":[156],"prediction.":[157]},"counts_by_year":[],"updated_date":"2026-02-01T03:34:12.195049","created_date":"2026-01-30T00:00:00"}
