{"id":"https://openalex.org/W7152068456","doi":"https://doi.org/10.48550/arxiv.2604.05181","title":"General Multimodal Protein Design Enables DNA-Encoding of Chemistry","display_name":"General Multimodal Protein Design Enables DNA-Encoding of Chemistry","publication_year":2026,"publication_date":"2026-04-06","ids":{"openalex":"https://openalex.org/W7152068456","doi":"https://doi.org/10.48550/arxiv.2604.05181"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05181","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05181","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05181","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041633236","display_name":"Jarrid Rector-Brooks","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rector-Brooks, Jarrid","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006797728","display_name":"T Lambert","orcid":"https://orcid.org/0009-0005-8485-8729"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lambert, Th\u00e9ophile","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133173705","display_name":"Marta Skreta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Skreta, Marta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133178645","display_name":"Daniel Roth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Roth, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045962323","display_name":"Yueming Long","orcid":"https://orcid.org/0009-0006-5112-7791"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Long, Yueming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133216129","display_name":"Zi-Qi Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zi-Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133160547","display_name":"Xi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133201198","display_name":"Miruna Cretu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cretu, Miruna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049122816","display_name":"Francesca-Zhoufan Li","orcid":"https://orcid.org/0000-0002-5710-9512"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Francesca-Zhoufan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114674307","display_name":"Tanvi Ganapathy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ganapathy, Tanvi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133216865","display_name":"Emily Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Emily","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073468005","display_name":"Avishek Joey Bose","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bose, Avishek Joey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133213996","display_name":"Jason Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Jason","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051657374","display_name":"Kirill Neklyudov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Neklyudov, Kirill","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133170495","display_name":"Yoshua Bengio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bengio, Yoshua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133171485","display_name":"Alexander Tong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tong, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043841592","display_name":"Frances H. Arnold","orcid":"https://orcid.org/0000-0002-4027-364X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arnold, Frances H.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101721519","display_name":"Chenghao Liu","orcid":"https://orcid.org/0000-0001-7976-1264"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Cheng-Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":18,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11611","display_name":"Cyclopropane Reaction Mechanisms","score":0.9247000217437744,"subfield":{"id":"https://openalex.org/subfields/1605","display_name":"Organic Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11611","display_name":"Cyclopropane Reaction Mechanisms","score":0.9247000217437744,"subfield":{"id":"https://openalex.org/subfields/1605","display_name":"Organic Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10404","display_name":"Enzyme Catalysis and Immobilization","score":0.009800000116229057,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11626","display_name":"Metalloenzymes and iron-sulfur proteins","score":0.005200000014156103,"subfield":{"id":"https://openalex.org/subfields/2105","display_name":"Renewable Energy, Sustainability and the Environment"},"field":{"id":"https://openalex.org/fields/21","display_name":"Energy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/protein-design","display_name":"Protein design","score":0.7146000266075134},{"id":"https://openalex.org/keywords/mutagenesis","display_name":"Mutagenesis","score":0.5302000045776367},{"id":"https://openalex.org/keywords/enzyme","display_name":"Enzyme","score":0.515500009059906},{"id":"https://openalex.org/keywords/protein-engineering","display_name":"Protein engineering","score":0.5044999718666077},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4327000081539154},{"id":"https://openalex.org/keywords/directed-evolution","display_name":"Directed evolution","score":0.414000004529953},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.38920000195503235},{"id":"https://openalex.org/keywords/genetic-code","display_name":"Genetic code","score":0.3714999854564667},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.3677999973297119}],"concepts":[{"id":"https://openalex.org/C152769699","wikidata":"https://www.wikidata.org/wiki/Q410814","display_name":"Protein design","level":3,"score":0.7146000266075134},{"id":"https://openalex.org/C16318435","wikidata":"https://www.wikidata.org/wiki/Q149299","display_name":"Mutagenesis","level":4,"score":0.5302000045776367},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5260000228881836},{"id":"https://openalex.org/C181199279","wikidata":"https://www.wikidata.org/wiki/Q8047","display_name":"Enzyme","level":2,"score":0.515500009059906},{"id":"https://openalex.org/C147816474","wikidata":"https://www.wikidata.org/wiki/Q169525","display_name":"Protein engineering","level":3,"score":0.5044999718666077},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.4797999858856201},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4327000081539154},{"id":"https://openalex.org/C9418097","wikidata":"https://www.wikidata.org/wiki/Q440681","display_name":"Directed evolution","level":4,"score":0.414000004529953},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39410001039505005},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.38920000195503235},{"id":"https://openalex.org/C10853874","wikidata":"https://www.wikidata.org/wiki/Q180618","display_name":"Genetic code","level":3,"score":0.3714999854564667},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.35850000381469727},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.3292999863624573},{"id":"https://openalex.org/C171250308","wikidata":"https://www.wikidata.org/wiki/Q11468","display_name":"Nanotechnology","level":1,"score":0.3287000060081482},{"id":"https://openalex.org/C84211826","wikidata":"https://www.wikidata.org/wiki/Q5260078","display_name":"Deoxyribozyme","level":3,"score":0.31929999589920044},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3091999888420105},{"id":"https://openalex.org/C191503008","wikidata":"https://www.wikidata.org/wiki/Q16007026","display_name":"Biocatalysis","level":4,"score":0.298799991607666},{"id":"https://openalex.org/C2779379725","wikidata":"https://www.wikidata.org/wiki/Q2914572","display_name":"Artificial enzyme","level":3,"score":0.29510000348091125},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.28439998626708984},{"id":"https://openalex.org/C2779222958","wikidata":"https://www.wikidata.org/wiki/Q45422","display_name":"Yeast","level":2,"score":0.28380000591278076},{"id":"https://openalex.org/C2993809622","wikidata":"https://www.wikidata.org/wiki/Q4300350","display_name":"Protein chemistry","level":2,"score":0.2791999876499176},{"id":"https://openalex.org/C110332635","wikidata":"https://www.wikidata.org/wiki/Q629498","display_name":"Genetic programming","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C191908910","wikidata":"https://www.wikidata.org/wiki/Q862838","display_name":"Synthetic biology","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.2556000053882599},{"id":"https://openalex.org/C2908542902","wikidata":"https://www.wikidata.org/wiki/Q440681","display_name":"Directed Molecular Evolution","level":5,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05181","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05181","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05181","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05181","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Evolution":[0],"is":[1,145],"an":[2],"extraordinary":[3],"engine":[4],"for":[5,46],"enzymatic":[6],"diversity,":[7],"yet":[8],"the":[9,137],"chemistry":[10],"it":[11],"has":[12],"explored":[13],"remains":[14],"a":[15,49,113,129],"narrow":[16],"slice":[17],"of":[18,107,112,140],"what":[19],"DNA":[20],"can":[21,26,121],"encode.":[22],"Deep":[23],"generative":[24],"models":[25],"design":[27,115],"new":[28],"proteins":[29],"that":[30,52,68,118],"bind":[31],"ligands,":[32],"but":[33],"none":[34],"have":[35],"created":[36],"enzymes":[37,83,89],"without":[38],"pre-specifying":[39],"catalytic":[40],"residues.":[41],"We":[42],"introduce":[43],"DISCO":[44,79,135],"(DIffusion":[45],"Sequence-structure":[47],"CO-design),":[48],"multimodal":[50],"model":[51],"co-designs":[53],"protein":[54],"sequence":[55],"and":[56,99],"3D":[57],"structure":[58],"around":[59],"arbitrary":[60],"biomolecules,":[61],"as":[62,64],"well":[63],"inference-time":[65],"scaling":[66],"methods":[67],"optimize":[69],"objectives":[70],"across":[71],"both":[72],"modalities.":[73],"Conditioned":[74],"solely":[75],"on":[76],"reactive":[77],"intermediates,":[78],"designs":[80],"diverse":[81],"heme":[82],"with":[84,102],"novel":[85],"active-site":[86],"geometries.":[87],"These":[88],"catalyze":[90],"new-to-nature":[91],"carbene-transfer":[92],"reactions,":[93],"including":[94],"alkene":[95],"cyclopropanation,":[96],"spirocyclopropanation,":[97],"B-H,":[98],"C(sp$^3$)-H":[100],"insertions,":[101],"high":[103],"activities":[104],"exceeding":[105],"those":[106],"engineered":[108],"enzymes.":[109],"Random":[110],"mutagenesis":[111],"selected":[114],"further":[116],"confirmed":[117],"enzyme":[119],"activity":[120],"be":[122],"improved":[123],"through":[124],"directed":[125],"evolution.":[126],"By":[127],"providing":[128],"scalable":[130],"route":[131],"to":[132],"evolvable":[133],"enzymes,":[134],"broadens":[136],"potential":[138],"scope":[139],"genetically":[141],"encodable":[142],"transformations.":[143],"Code":[144],"available":[146],"at":[147],"https://github.com/DISCO-design/DISCO.":[148]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-09T00:00:00"}
