{"id":"https://openalex.org/W4417062421","doi":"https://doi.org/10.1145/3768322.3769031","title":"Benchmarking and Consensus Ranking of Inverse Folding Models for Protein-Ligand Interface Design","display_name":"Benchmarking and Consensus Ranking of Inverse Folding Models for Protein-Ligand Interface Design","publication_year":2025,"publication_date":"2025-10-11","ids":{"openalex":"https://openalex.org/W4417062421","doi":"https://doi.org/10.1145/3768322.3769031"},"language":"en","primary_location":{"id":"doi:10.1145/3768322.3769031","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3768322.3769031","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3768322.3769031","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion Proceedings of the 16th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3768322.3769031","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103713337","display_name":"Yao Wei","orcid":"https://orcid.org/0009-0008-8683-8459"},"institutions":[{"id":"https://openalex.org/I189158943","display_name":"University of Milan","ror":"https://ror.org/00wjc7c48","country_code":"IT","type":"education","lineage":["https://openalex.org/I189158943"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Yao Wei","raw_affiliation_strings":["Department of Pharmacological and Biomolecular Sciences, University of Milan, Milan, MI, Italy"],"raw_orcid":"https://orcid.org/0009-0008-8683-8459","affiliations":[{"raw_affiliation_string":"Department of Pharmacological and Biomolecular Sciences, University of Milan, Milan, MI, Italy","institution_ids":["https://openalex.org/I189158943"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039901296","display_name":"Uliano Guerrini","orcid":"https://orcid.org/0000-0001-7291-5160"},"institutions":[{"id":"https://openalex.org/I189158943","display_name":"University of Milan","ror":"https://ror.org/00wjc7c48","country_code":"IT","type":"education","lineage":["https://openalex.org/I189158943"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Uliano Guerrini","raw_affiliation_strings":["Department of Pharmacological and Biomolecular Sciences, University of Milan, Milan, MI, Italy"],"raw_orcid":"https://orcid.org/0000-0001-7291-5160","affiliations":[{"raw_affiliation_string":"Department of Pharmacological and Biomolecular Sciences, University of Milan, Milan, MI, Italy","institution_ids":["https://openalex.org/I189158943"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029213430","display_name":"Ivano Eberini","orcid":"https://orcid.org/0000-0001-5521-3829"},"institutions":[{"id":"https://openalex.org/I189158943","display_name":"University of Milan","ror":"https://ror.org/00wjc7c48","country_code":"IT","type":"education","lineage":["https://openalex.org/I189158943"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Ivano Eberini","raw_affiliation_strings":["Department of Pharmacological and Biomolecular Sciences, University of Milan, Milan, MI, Italy"],"raw_orcid":"https://orcid.org/0000-0001-5521-3829","affiliations":[{"raw_affiliation_string":"Department of Pharmacological and Biomolecular Sciences, University of Milan, Milan, MI, Italy","institution_ids":["https://openalex.org/I189158943"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5103713337"],"corresponding_institution_ids":["https://openalex.org/I189158943"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.33109333,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.5019000172615051,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.5019000172615051,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.18070000410079956,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.041099999099969864,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6669999957084656},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6225000023841858},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.42329999804496765},{"id":"https://openalex.org/keywords/inverse","display_name":"Inverse","score":0.41819998621940613},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4074000120162964},{"id":"https://openalex.org/keywords/folding","display_name":"Folding (DSP implementation)","score":0.39100000262260437},{"id":"https://openalex.org/keywords/protein-design","display_name":"Protein design","score":0.3262999951839447},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.32269999384880066}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6689000129699707},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6669999957084656},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6225000023841858},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5551999807357788},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4749999940395355},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.42329999804496765},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4074000120162964},{"id":"https://openalex.org/C2776545253","wikidata":"https://www.wikidata.org/wiki/Q5464292","display_name":"Folding (DSP implementation)","level":2,"score":0.39100000262260437},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36739999055862427},{"id":"https://openalex.org/C152769699","wikidata":"https://www.wikidata.org/wiki/Q410814","display_name":"Protein design","level":3,"score":0.3262999951839447},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.32269999384880066},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.2912999987602234},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C66153294","wikidata":"https://www.wikidata.org/wiki/Q899291","display_name":"CASP","level":4,"score":0.2766999900341034},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C18051474","wikidata":"https://www.wikidata.org/wiki/Q899656","display_name":"Protein structure prediction","level":3,"score":0.27300000190734863},{"id":"https://openalex.org/C204328495","wikidata":"https://www.wikidata.org/wiki/Q847556","display_name":"Protein folding","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26600000262260437},{"id":"https://openalex.org/C83282275","wikidata":"https://www.wikidata.org/wiki/Q7435350","display_name":"Scoring algorithm","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.25679999589920044}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3768322.3769031","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3768322.3769031","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3768322.3769031","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion Proceedings of the 16th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},{"id":"pmh:oai:air.unimi.it:2434/1203255","is_oa":true,"landing_page_url":"https://hdl.handle.net/2434/1203255","pdf_url":null,"source":{"id":"https://openalex.org/S4306400516","display_name":"Archivio Istituzionale della Ricerca (Universita Degli Studi Di Milano)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I189158943","host_organization_name":"University of Milan","host_organization_lineage":["https://openalex.org/I189158943"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/bookPart"}],"best_oa_location":{"id":"doi:10.1145/3768322.3769031","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3768322.3769031","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3768322.3769031","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion Proceedings of the 16th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6855854724","display_name":"Metal-containing Radical Enzymes","funder_award_id":"101073546","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320321873","display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","ror":"https://ror.org/0166hxq48"},{"id":"https://openalex.org/F4320334322","display_name":"HORIZON EUROPE Framework Programme","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4417062421.pdf","grobid_xml":"https://content.openalex.org/works/W4417062421.grobid-xml"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W2016610222","https://openalex.org/W2033969841","https://openalex.org/W2052030759","https://openalex.org/W2079995754","https://openalex.org/W2098949725","https://openalex.org/W2103994532","https://openalex.org/W2557706956","https://openalex.org/W2885392370","https://openalex.org/W3130943755","https://openalex.org/W3133458480","https://openalex.org/W3177828909","https://openalex.org/W3179412555","https://openalex.org/W4284685307","https://openalex.org/W4295014386","https://openalex.org/W4299702438","https://openalex.org/W4327550249","https://openalex.org/W4383957026","https://openalex.org/W4388718657","https://openalex.org/W4396721167","https://openalex.org/W4400985732","https://openalex.org/W4401831880"],"related_works":[],"abstract_inverted_index":{"Machine":[0],"learning":[1],"has":[2],"advanced":[3],"the":[4,21,30,73,152],"progress":[5],"of":[6,16,23,33,157],"protein":[7,35,159],"design,":[8],"also":[9],"enabling":[10],"more":[11],"efficient":[12],"and":[13,63,86,115,122,137,155],"accurate":[14],"modeling":[15],"protein-ligand":[17,70],"interfaces.":[18],"Due":[19],"to":[20,67,92],"complexity":[22],"biological":[24],"systems,":[25],"selecting":[26],"optimal":[27],"candidates":[28],"from":[29,72],"heterogeneous":[31,94],"outputs":[32],"generative":[34],"design":[36,79,143],"tools":[37],"remains":[38],"a":[39,47,82,88,98,129],"persistent":[40],"challenge.":[41],"In":[42,128],"this":[43],"work,":[44],"we":[45],"introduce":[46],"consensus":[48,147],"ranking":[49,148],"framework":[50],"that":[51,104,146],"integrates":[52],"five":[53],"state-of-the-art":[54],"inverse":[55],"folding":[56],"models":[57],"\u2014":[58,65],"ProteinMPNN,":[59],"LigandMPNN,":[60],"ESM-IF1,":[61],"CARBonAra,":[62],"ProRefiner":[64],"applied":[66],"25,716":[68],"curated":[69],"complexes":[71],"BioLip":[74],"database.":[75],"Our":[76],"approach":[77],"frames":[78],"selection":[80],"as":[81,118],"supervised":[83],"learning-to-rank":[84],"problem":[85],"leverages":[87],"LightGBM-based":[89],"LambdaMART":[90],"model":[91,109],"fuse":[93],"scoring":[95],"features":[96],"into":[97],"unified":[99],"ranking.":[100],"We":[101],"pointed":[102],"out":[103],"consensus-ranked":[105],"sequences":[106],"outperform":[107],"individual":[108],"selections":[110],"in":[111],"stability,":[112],"binding":[113],"affinity,":[114],"structural":[116],"fidelity,":[117],"evaluated":[119],"using":[120],"Schr\u00f6dinger":[121],"MOE":[123],"free":[124],"energy":[125],"difference":[126],"calculations.":[127],"case":[130],"study":[131],"on":[132],"three":[133],"enzymes":[134],"(NOV1,":[135],"CYP153A,":[136],"LCD),":[138],"our":[139],"method":[140],"consistently":[141],"improves":[142],"quality,":[144],"suggesting":[145],"can":[149],"significantly":[150],"enhance":[151],"success":[153],"rate":[154],"efficiency":[156],"AI-driven":[158],"engineering.":[160]},"counts_by_year":[],"updated_date":"2026-03-13T14:20:09.374765","created_date":"2025-12-05T00:00:00"}
