{"id":"https://openalex.org/W7147673913","doi":"https://doi.org/10.48550/arxiv.2603.27950","title":"Scaling Atomistic Protein Binder Design with Generative Pretraining and Test-Time Compute","display_name":"Scaling Atomistic Protein Binder Design with Generative Pretraining and Test-Time Compute","publication_year":2026,"publication_date":"2026-03-30","ids":{"openalex":"https://openalex.org/W7147673913","doi":"https://doi.org/10.48550/arxiv.2603.27950"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.27950","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27950","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.27950","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031230520","display_name":"Kieran Didi","orcid":"https://orcid.org/0000-0001-6839-3320"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Didi, Kieran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132656332","display_name":"Zuobai Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zuobai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132558607","display_name":"Guoqing Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Guoqing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032963060","display_name":"Danny Reidenbach","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reidenbach, Danny","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129655349","display_name":"Zhonglin Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Zhonglin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043633104","display_name":"Sooyoung Cha","orcid":"https://orcid.org/0000-0001-7211-4603"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cha, Sooyoung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085903755","display_name":"Tomas Geffner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Geffner, Tomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088531553","display_name":"Christian Dallago","orcid":"https://orcid.org/0000-0003-4650-6181"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dallago, Christian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132633314","display_name":"Jian Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132555362","display_name":"Michael M. Bronstein","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bronstein, Michael M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132617897","display_name":"Martin Steinegger","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Steinegger, Martin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009574969","display_name":"Emine K\u00fc\u00e7\u00fckbenli","orcid":"https://orcid.org/0000-0002-0588-7750"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kucukbenli, Emine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038984764","display_name":"Arash Vahdat","orcid":"https://orcid.org/0009-0005-9476-1306"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vahdat, Arash","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5032255237","display_name":"Karsten Kreis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kreis, Karsten","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5031230520"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.39969998598098755,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.39969998598098755,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11016","display_name":"Monoclonal and Polyclonal Antibodies Research","score":0.13940000534057617,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.13289999961853027,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.8288000226020813},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7141000032424927},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.6227999925613403},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.588699996471405},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4350000023841858},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.42250001430511475},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4196000099182129},{"id":"https://openalex.org/keywords/equivalence","display_name":"Equivalence (formal languages)","score":0.3849000036716461}],"concepts":[{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.8288000226020813},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7141000032424927},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.6227999925613403},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6225000023841858},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.588699996471405},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4629000127315521},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4350000023841858},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.42250001430511475},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4196000099182129},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.3849000036716461},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36660000681877136},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.3422999978065491},{"id":"https://openalex.org/C147816474","wikidata":"https://www.wikidata.org/wiki/Q169525","display_name":"Protein engineering","level":3,"score":0.34220001101493835},{"id":"https://openalex.org/C2776235265","wikidata":"https://www.wikidata.org/wiki/Q18392052","display_name":"Fragment (logic)","level":2,"score":0.337799996137619},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.33629998564720154},{"id":"https://openalex.org/C152769699","wikidata":"https://www.wikidata.org/wiki/Q410814","display_name":"Protein design","level":3,"score":0.3328999876976013},{"id":"https://openalex.org/C2780440489","wikidata":"https://www.wikidata.org/wiki/Q5227278","display_name":"Data-driven","level":2,"score":0.329800009727478},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.3174999952316284},{"id":"https://openalex.org/C184408114","wikidata":"https://www.wikidata.org/wiki/Q1502022","display_name":"Generative Design","level":3,"score":0.3167000114917755},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.31139999628067017},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.29580000042915344},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.2815000116825104},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2581000030040741},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.27950","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27950","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.27950","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27950","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Protein":[0],"interaction":[1],"modeling":[2,36],"is":[3,30,48],"central":[4],"to":[5,84,180],"protein":[6,70,82],"design,":[7],"which":[8],"has":[9],"been":[10],"transformed":[11],"by":[12],"machine":[13],"learning":[14],"with":[15,98,114],"applications":[16],"in":[17,136],"drug":[18],"discovery":[19],"and":[20,52,73,125,152,178,184,194],"beyond.":[21],"In":[22],"this":[23,47,102,115],"landscape,":[24],"structure-based":[25],"de":[26],"novo":[27],"binder":[28,59,138,176],"design":[29,139,186],"cast":[31],"as":[32],"either":[33],"conditional":[34],"generative":[35,116,124,150],"or":[37],"sequence":[38],"optimization":[39,113,156],"via":[40],"structure":[41],"predictors":[42],"(\"hallucination\").":[43],"We":[44,65,109,167],"argue":[45],"that":[46],"a":[49,55,87,105,130],"false":[50],"dichotomy":[51],"propose":[53],"Proteina-Complexa,":[54],"novel":[56,154],"fully":[57],"atomistic":[58],"generation":[60,71],"method":[61],"unifying":[62,118],"both":[63],"paradigms.":[64],"extend":[66],"recent":[67],"flow-based":[68],"latent":[69],"architectures":[72],"leverage":[74],"the":[75,119,134],"domain-domain":[76],"interactions":[77],"of":[78,91,121,133],"monomeric":[79],"computationally":[80],"predicted":[81],"structures":[83],"construct":[85],"Teddymer,":[86],"new":[88,131,195],"large-scale":[89],"dataset":[90],"synthetic":[92],"binder-target":[93],"pairs":[94],"for":[95],"pretraining.":[96],"Combined":[97],"high-quality":[99],"experimental":[100],"multimers,":[101],"enables":[103],"training":[104],"strong":[106],"base":[107],"model.":[108],"then":[110],"perform":[111],"inference-time":[112],"prior,":[117],"strengths":[120],"previously":[122],"distinct":[123],"hallucination":[126,161],"methods.":[127,191],"Proteina-Complexa":[128],"sets":[129],"state":[132],"art":[135],"computational":[137],"benchmarks:":[140],"it":[141],"delivers":[142],"markedly":[143],"higher":[144],"in-silico":[145],"success":[146],"rates":[147],"than":[148],"existing":[149],"approaches,":[151],"our":[153],"test-time":[155],"strategies":[157],"greatly":[158],"outperform":[159],"previous":[160],"methods":[162],"under":[163],"normalized":[164],"compute":[165],"budgets.":[166],"also":[168],"demonstrate":[169],"interface":[170],"hydrogen":[171],"bond":[172],"optimization,":[173],"fold":[174],"class-guided":[175],"generation,":[177],"extensions":[179],"small":[181],"molecule":[182],"targets":[183],"enzyme":[185],"tasks,":[187],"again":[188],"surpassing":[189],"prior":[190],"Code,":[192],"models":[193],"data":[196],"will":[197],"be":[198],"publicly":[199],"released.":[200]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-04-02T00:00:00"}
