{"id":"https://openalex.org/W7138080177","doi":"https://doi.org/10.1609/aaai.v40i1.36997","title":"S\u00b2Drug: Bridging Protein Sequence and 3D Structure in Contrastive Representation Learning for Virtual Screening","display_name":"S\u00b2Drug: Bridging Protein Sequence and 3D Structure in Contrastive Representation Learning for Virtual Screening","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138080177","doi":"https://doi.org/10.1609/aaai.v40i1.36997"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i1.36997","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i1.36997","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/36997/40959","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/36997/40959","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129725759","display_name":"Bowei He","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Bowei He","raw_affiliation_strings":["City University of Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"City University of Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129730461","display_name":"Bowen Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bowen Gao","raw_affiliation_strings":["Institute for AI Industry Research (AIR), Tsinghua University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for AI Industry Research (AIR), Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129668559","display_name":"Yankai Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yankai Chen","raw_affiliation_strings":["University of Illinois Chicago"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois Chicago","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121821741","display_name":"Yanyan Lan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanyan Lan","raw_affiliation_strings":["Institute for AI Industry Research (AIR), Tsinghua University\nBeijing Academy of Artificial Intelligence"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for AI Industry Research (AIR), Tsinghua University\nBeijing Academy of Artificial Intelligence","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129737370","display_name":"Chen Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Chen Ma","raw_affiliation_strings":["City University of Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"City University of Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036357902","display_name":"Philip S. Yu","orcid":"https://orcid.org/0000-0002-3491-5968"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Philip S. Yu","raw_affiliation_strings":["University of Illinois Chicago"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois Chicago","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129715953","display_name":"Ya-Qin Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ya-Qin Zhang","raw_affiliation_strings":["Institute for AI Industry Research (AIR), Tsinghua University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for AI Industry Research (AIR), Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129678901","display_name":"Wei-Ying Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei-Ying Ma","raw_affiliation_strings":["Institute for AI Industry Research (AIR), Tsinghua University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for AI Industry Research (AIR), Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5129725759"],"corresponding_institution_ids":["https://openalex.org/I168719708"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21428571,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"1","first_page":"354","last_page":"362"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.5360000133514404,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.5360000133514404,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.23510000109672546,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.09009999781847,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.520799994468689},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.5182999968528748},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.5164999961853027},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4499000012874603},{"id":"https://openalex.org/keywords/virtual-screening","display_name":"Virtual screening","score":0.43529999256134033},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.38609999418258667},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35019999742507935},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.3499999940395355}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7135000228881836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6327999830245972},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.520799994468689},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.5182999968528748},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5164999961853027},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4499000012874603},{"id":"https://openalex.org/C103697762","wikidata":"https://www.wikidata.org/wiki/Q4112105","display_name":"Virtual screening","level":3,"score":0.43529999256134033},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.38609999418258667},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37059998512268066},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35019999742507935},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.3499999940395355},{"id":"https://openalex.org/C40506919","wikidata":"https://www.wikidata.org/wiki/Q7452469","display_name":"Sequence learning","level":2,"score":0.34790000319480896},{"id":"https://openalex.org/C152769699","wikidata":"https://www.wikidata.org/wiki/Q410814","display_name":"Protein design","level":3,"score":0.3463999927043915},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3314000070095062},{"id":"https://openalex.org/C200307862","wikidata":"https://www.wikidata.org/wiki/Q7797175","display_name":"Threading (protein sequence)","level":3,"score":0.32359999418258667},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3000999987125397},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C63222358","wikidata":"https://www.wikidata.org/wiki/Q6120337","display_name":"chEMBL","level":3,"score":0.2775000035762787},{"id":"https://openalex.org/C171897839","wikidata":"https://www.wikidata.org/wiki/Q417841","display_name":"Protein family","level":3,"score":0.2671000063419342},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.2669000029563904},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.26269999146461487},{"id":"https://openalex.org/C136475424","wikidata":"https://www.wikidata.org/wiki/Q7251500","display_name":"Protein structure database","level":4,"score":0.25209999084472656},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i1.36997","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i1.36997","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/36997/40959","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i1.36997","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i1.36997","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/36997/40959","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309893","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335581","display_name":"Young Scientists Fund","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138080177.pdf","grobid_xml":"https://content.openalex.org/works/W7138080177.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Virtual":[0],"screening":[1,187],"(VS)":[2],"is":[3],"an":[4,107,149],"essential":[5],"task":[6,157],"in":[7,66,90,205],"drug":[8],"discovery,":[9],"focusing":[10],"on":[11,38,104,122,134,193],"the":[12,62,96,129,159,167,198],"identification":[13],"of":[14,200],"small-molecule":[15],"ligands":[16],"that":[17,80],"bind":[18],"to":[19,31,61,117,161],"specific":[20],"protein":[21,43,56,83,101,124,168],"pockets.":[22],"Existing":[23],"deep":[24],"learning":[25,34],"methods,":[26],"from":[27],"early":[28],"regression":[29],"models":[30],"recent":[32],"contrastive":[33,92,206],"approaches,":[35],"primarily":[36],"rely":[37],"structural":[39],"data":[40,114],"while":[41,147],"overlooking":[42],"sequences,":[44],"which":[45],"are":[46],"more":[47],"accessible":[48],"and":[49,64,86,120,125,139,170,189,203],"can":[50],"enhance":[51],"generalizability.":[52],"However,":[53],"directly":[54],"integrating":[55],"sequences":[57],"poses":[58],"challenges":[59],"due":[60],"redundancy":[63,119],"noise":[65,121],"large-scale":[67],"protein-ligand":[68,91,178],"datasets.":[69],"To":[70],"address":[71],"these":[72],"limitations,":[73],"we":[74,99,132],"propose":[75],"S\u00b2Drug,":[76],"a":[77,112,143],"two-stage":[78],"framework":[79],"explicitly":[81],"incorporates":[82],"Sequence":[84],"information":[85,141],"3D":[87,173],"Structure":[88],"context":[89],"representation":[93],"learning.":[94,207],"In":[95,128],"first":[97],"stage,":[98,131],"perform":[100],"sequence":[102,138,169,202],"pretraining":[103],"ChemBL":[105],"using":[106],"ESM2-based":[108],"backbone,":[109],"combined":[110],"with":[111],"tailored":[113],"sampling":[115],"strategy":[116],"reduce":[118],"both":[123],"ligand":[126],"sides.":[127],"second":[130],"fine-tune":[133],"PDBBind":[135],"by":[136],"fusing":[137],"structure":[140,204],"through":[142],"residue-level":[144],"gating":[145],"module,":[146],"introducing":[148],"auxiliary":[150,156],"binding":[151,164,194],"site":[152,195],"prediction":[153],"task.":[154],"This":[155],"guides":[158],"model":[160],"accurately":[162],"localize":[163],"residues":[165],"within":[166],"capture":[171],"their":[172],"spatial":[174],"arrangement,":[175],"thereby":[176],"refining":[177],"matching.":[179],"Across":[180],"multiple":[181],"benchmarks,":[182],"S\u00b2Drug":[183],"consistently":[184],"improves":[185],"virtual":[186],"performance":[188],"achieves":[190],"strong":[191],"results":[192],"prediction,":[196],"demonstrating":[197],"value":[199],"bridging":[201]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2026-03-18T00:00:00"}
