{"id":"https://openalex.org/W7162633601","doi":"https://doi.org/10.48550/arxiv.2605.27413","title":"Ligand-Conditioned Discrete Diffusion for Protein Sequence-Structure Co-Design","display_name":"Ligand-Conditioned Discrete Diffusion for Protein Sequence-Structure Co-Design","publication_year":2026,"publication_date":"2026-05-15","ids":{"openalex":"https://openalex.org/W7162633601","doi":"https://doi.org/10.48550/arxiv.2605.27413"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27413","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27413","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27413","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137193123","display_name":"Chen Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047163587","display_name":"Fanding Xu","orcid":"https://orcid.org/0000-0001-7220-8693"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Fanding","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128014008","display_name":"Minghao Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Minghao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137289904","display_name":"Zhiyuan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zhiyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137221735","display_name":"Lin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137233254","display_name":"Tianrui Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Tianrui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137220784","display_name":"Yihang Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yihang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137271803","display_name":"Yang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.5313000082969666,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.5313000082969666,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10621","display_name":"Gene Regulatory Network Analysis","score":0.11150000244379044,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.09629999846220016,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.6363999843597412},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5965999960899353},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.5024999976158142},{"id":"https://openalex.org/keywords/protein-design","display_name":"Protein design","score":0.38199999928474426},{"id":"https://openalex.org/keywords/ligand","display_name":"Ligand (biochemistry)","score":0.336899995803833},{"id":"https://openalex.org/keywords/protein-structure-prediction","display_name":"Protein structure prediction","score":0.32420000433921814},{"id":"https://openalex.org/keywords/discrete-time-and-continuous-time","display_name":"Discrete time and continuous time","score":0.30880001187324524}],"concepts":[{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.6363999843597412},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5965999960899353},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5525000095367432},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.5024999976158142},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.48829999566078186},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.43320000171661377},{"id":"https://openalex.org/C152769699","wikidata":"https://www.wikidata.org/wiki/Q410814","display_name":"Protein design","level":3,"score":0.38199999928474426},{"id":"https://openalex.org/C116569031","wikidata":"https://www.wikidata.org/wiki/Q899107","display_name":"Ligand (biochemistry)","level":3,"score":0.336899995803833},{"id":"https://openalex.org/C18051474","wikidata":"https://www.wikidata.org/wiki/Q899656","display_name":"Protein structure prediction","level":3,"score":0.32420000433921814},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C2779664074","wikidata":"https://www.wikidata.org/wiki/Q3518405","display_name":"Terminal (telecommunication)","level":2,"score":0.2971000075340271},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.28850001096725464},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.2874000072479248},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2851000130176544},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.2773999869823456},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.27399998903274536},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.2623000144958496},{"id":"https://openalex.org/C136475424","wikidata":"https://www.wikidata.org/wiki/Q7251500","display_name":"Protein structure database","level":4,"score":0.2567000091075897},{"id":"https://openalex.org/C41685203","wikidata":"https://www.wikidata.org/wiki/Q1974042","display_name":"Docking (animal)","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C144292202","wikidata":"https://www.wikidata.org/wiki/Q898273","display_name":"Protein domain","level":3,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27413","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27413","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27413","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27413","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Proteins":[0],"perform":[1],"their":[2],"biological":[3],"functions":[4],"through":[5,88],"three-dimensional":[6],"structures":[7],"encoded":[8],"by":[9],"amino":[10],"acid":[11],"sequences,":[12],"and":[13,31,77,85,124,144,163,174],"ligand-binding":[14],"protein":[15,45,69,106,196],"co-design":[16],"requires":[17],"models":[18,33,47],"that":[19,120],"generate":[20],"sequence-structure":[21,70],"compatible":[22],"proteins":[23],"under":[24,179],"explicit":[25],"ligand":[26,83],"constraints.":[27],"Although":[28],"continuous":[29],"diffusion":[30,44,102,188],"flow-based":[32],"support":[34,185],"ligand-aware":[35,104,165],"design":[36],"in":[37,135],"coordinate":[38],"or":[39,52],"latent":[40],"spaces,":[41],"existing":[42],"discrete":[43,78,101,187],"language":[46],"mainly":[48],"operate":[49],"over":[50,93,133,168],"sequence":[51,76],"structure":[53,79],"tokens":[54,80],"without":[55],"direct":[56],"small-molecule":[57],"conditioning.":[58],"We":[59,108],"introduce":[60],"\\textbf{ProtLiD$^2$},":[61],"a":[62],"\\textbf{Prot}ein":[63],"\\textbf{L}igand-conditioned":[64],"\\textbf{D}iscrete":[65],"\\textbf{D}iffusion":[66],"model":[67],"for":[68,159,194],"co-design.":[71,197],"ProtLiD$^2$":[72,98,128,153],"jointly":[73],"generates":[74],"amino-acid":[75],"while":[81],"incorporating":[82],"chemical":[84],"geometric":[86],"information":[87],"geometry-aware":[89],"cross-attention.":[90],"Trained":[91],"on":[92],"one":[94],"million":[95],"ligand-protein":[96],"complexes,":[97],"extends":[99],"masked":[100],"to":[103,142,148,161,172,177],"functional":[105,195],"design.":[107],"further":[109],"propose":[110],"maximum":[111],"confidence-margin":[112],"guided":[113],"ReMask":[114],"decoding,":[115],"an":[116,190],"inference-time":[117],"self-correction":[118],"strategy":[119],"retains":[121],"confident":[122],"predictions":[123],"remasks":[125],"uncertain":[126],"tokens.":[127],"improves":[129,164],"global":[130],"fold":[131],"confidence":[132],"Complexa":[134],"whole-protein":[136],"design,":[137],"increasing":[138],"TM-score":[139],"from":[140,146,157,170,175],"0.672":[141],"0.802":[143],"pLDDT":[145],"64.55":[147],"73.00.":[149],"In":[150],"pocket":[151],"co-design,":[152],"reduces":[154],"active-site":[155],"BB-RMSD":[156],"3.46/3.40\u00c5":[158],"FAIR/PocketGen":[160],"1.97\u00c5,":[162],"pass":[166],"rates":[167],"PocketGen":[169],"14.86%":[171],"59.73%":[173],"6.08%":[176],"23.49%":[178],"stricter":[180],"docking":[181],"thresholds.":[182],"These":[183],"results":[184],"ligand-conditioned":[186],"as":[189],"effective":[191],"token-space":[192],"framework":[193],"Code":[198],"will":[199],"be":[200],"available":[201],"at":[202],"https://github.com/auroua/ProtLiD.":[203]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-29T00:00:00"}
