{"id":"https://openalex.org/W7126163921","doi":"https://doi.org/10.1177/15578666251405823","title":"Deep Batch Active Learning for Protein Structure Modeling","display_name":"Deep Batch Active Learning for Protein Structure Modeling","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7126163921","doi":"https://doi.org/10.1177/15578666251405823","pmid":"https://pubmed.ncbi.nlm.nih.gov/41614412"},"language":"en","primary_location":{"id":"doi:10.1177/15578666251405823","is_oa":false,"landing_page_url":"https://doi.org/10.1177/15578666251405823","pdf_url":null,"source":{"id":"https://openalex.org/S78571599","display_name":"Journal of Computational Biology","issn_l":"1066-5277","issn":["1066-5277","1557-8666"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320443","host_organization_name":"Mary Ann Liebert, Inc.","host_organization_lineage":["https://openalex.org/P4310320443"],"host_organization_lineage_names":["Mary Ann Liebert, Inc."],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014367289","display_name":"Zexin Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zexin Xue","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124336786","display_name":"Michael Bailey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michael Bailey","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108102436","display_name":"Abhinav Gupta","orcid":null},"institutions":[{"id":"https://openalex.org/I3018075036","display_name":"Sanofi (France)","ror":"https://ror.org/02n6c9837","country_code":"FR","type":"company","lineage":["https://openalex.org/I3018075036"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Abhinav Gupta","raw_affiliation_strings":["Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA","institution_ids":["https://openalex.org/I3018075036"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124324111","display_name":"Ruijiang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I3018075036","display_name":"Sanofi (France)","ror":"https://ror.org/02n6c9837","country_code":"FR","type":"company","lineage":["https://openalex.org/I3018075036"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Ruijiang Li","raw_affiliation_strings":["Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA","institution_ids":["https://openalex.org/I3018075036"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092566342","display_name":"Alejandro Corrochano-Navarro","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alejandro Corrochano-Navarro","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113232007","display_name":"Sizhen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sizhen Li","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124308767","display_name":"Lorenzo Kogler-Anele","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lorenzo Kogler-Anele","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065715141","display_name":"Qui Bo Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I3018075036","display_name":"Sanofi (France)","ror":"https://ror.org/02n6c9837","country_code":"FR","type":"company","lineage":["https://openalex.org/I3018075036"]},{"id":"https://openalex.org/I4210092243","display_name":"AstraZeneca (South Korea)","ror":"https://ror.org/00h1xaa75","country_code":"KR","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210092243"]},{"id":"https://openalex.org/I4210116875","display_name":"AstraZeneca (Brazil)","ror":"https://ror.org/026m9xy48","country_code":"BR","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210116875"]},{"id":"https://openalex.org/I4210150756","display_name":"AstraZeneca (United States)","ror":"https://ror.org/043cec594","country_code":"US","type":"company","lineage":["https://openalex.org/I105036370","https://openalex.org/I4210150756"]}],"countries":["BR","FR","KR","US"],"is_corresponding":false,"raw_author_name":"Qui Yu","raw_affiliation_strings":["Biologics Engineering, Oncology R&amp;D, AstraZeneca, Waltham, Massachusetts, USA","Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Biologics Engineering, Oncology R&amp;D, AstraZeneca, Waltham, Massachusetts, USA","institution_ids":["https://openalex.org/I4210092243","https://openalex.org/I4210150756","https://openalex.org/I4210116875"]},{"raw_affiliation_string":"Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA","institution_ids":["https://openalex.org/I3018075036"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023958187","display_name":"Heidi Rommelaere","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123153","display_name":"Sanofi (Belgium)","ror":"https://ror.org/02wnz8673","country_code":"BE","type":"company","lineage":["https://openalex.org/I3018075036","https://openalex.org/I4210123153"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Heidi Rommelaere","raw_affiliation_strings":["NANOBODY Research Platform, Sanofi R&amp;D, Sanofi, Zwijnaarde, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NANOBODY Research Platform, Sanofi R&amp;D, Sanofi, Zwijnaarde, Belgium","institution_ids":["https://openalex.org/I4210123153"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075751283","display_name":"Wander Van Breedam","orcid":"https://orcid.org/0000-0001-7755-988X"},"institutions":[{"id":"https://openalex.org/I4210123153","display_name":"Sanofi (Belgium)","ror":"https://ror.org/02wnz8673","country_code":"BE","type":"company","lineage":["https://openalex.org/I3018075036","https://openalex.org/I4210123153"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Wander Van Breedam","raw_affiliation_strings":["NANOBODY Research Platform, Sanofi R&amp;D, Sanofi, Zwijnaarde, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NANOBODY Research Platform, Sanofi R&amp;D, Sanofi, Zwijnaarde, Belgium","institution_ids":["https://openalex.org/I4210123153"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026077258","display_name":"Norbert Furtmann","orcid":"https://orcid.org/0009-0006-8226-7586"},"institutions":[{"id":"https://openalex.org/I4210138838","display_name":"Sanofi (Germany)","ror":"https://ror.org/03ytdtb31","country_code":"DE","type":"company","lineage":["https://openalex.org/I3018075036","https://openalex.org/I4210138838"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Norbert Furtmann","raw_affiliation_strings":["Large Molecule Research, Sanofi, Frankfurt, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Large Molecule Research, Sanofi, Frankfurt, Germany","institution_ids":["https://openalex.org/I4210138838"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088995400","display_name":"Joseph D. Batchelor","orcid":"https://orcid.org/0000-0002-9701-9255"},"institutions":[{"id":"https://openalex.org/I3018075036","display_name":"Sanofi (France)","ror":"https://ror.org/02n6c9837","country_code":"FR","type":"company","lineage":["https://openalex.org/I3018075036"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Joseph Batchelor","raw_affiliation_strings":["Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Large Molecule Research, Sanofi, Cambridge, Massachusetts, USA","institution_ids":["https://openalex.org/I3018075036"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099576104","display_name":"Bar-Joseph Ziv","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ziv Bar-Joseph","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124377144","display_name":"Sven Jager","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sven Jager","raw_affiliation_strings":["R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"R&amp;D Data &amp; Computational Science, Sanofi, Cambridge, Massachusetts, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":6,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5014367289"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14301547,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"33","issue":"1","first_page":"184","last_page":"200"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.3711000084877014,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.3711000084877014,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12576","display_name":"vaccines and immunoinformatics approaches","score":0.1671999990940094,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.13449999690055847,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6948000192642212},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5548999905586243},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4113999903202057},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.39820000529289246},{"id":"https://openalex.org/keywords/monte-carlo-method","display_name":"Monte Carlo method","score":0.3921000063419342},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.34790000319480896},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.335999995470047},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3328999876976013}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7017999887466431},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6948000192642212},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5548999905586243},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5037999749183655},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49410000443458557},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4113999903202057},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.39820000529289246},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.3921000063419342},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.34790000319480896},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.335999995470047},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33480000495910645},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3328999876976013},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.3292999863624573},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.3199999928474426},{"id":"https://openalex.org/C143587482","wikidata":"https://www.wikidata.org/wiki/Q1543216","display_name":"Iterative and incremental development","level":2,"score":0.31139999628067017},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.30790001153945923},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C191120209","wikidata":"https://www.wikidata.org/wiki/Q908902","display_name":"Structural biology","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C2984074130","wikidata":"https://www.wikidata.org/wiki/Q73539779","display_name":"R package","level":2,"score":0.2653000056743622},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2542000114917755}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011487","descriptor_name":"Protein Conformation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1177/15578666251405823","is_oa":false,"landing_page_url":"https://doi.org/10.1177/15578666251405823","pdf_url":null,"source":{"id":"https://openalex.org/S78571599","display_name":"Journal of Computational Biology","issn_l":"1066-5277","issn":["1066-5277","1557-8666"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320443","host_organization_name":"Mary Ann Liebert, Inc.","host_organization_lineage":["https://openalex.org/P4310320443"],"host_organization_lineage_names":["Mary Ann Liebert, Inc."],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Computational Biology","raw_type":"journal-article"},{"id":"pmid:41614412","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41614412","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of computational biology : a journal of computational molecular cell biology","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.4976292550563812,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1855237549","https://openalex.org/W2128019145","https://openalex.org/W2150593711","https://openalex.org/W2151023586","https://openalex.org/W2395579298","https://openalex.org/W2591883888","https://openalex.org/W2949071206","https://openalex.org/W3023204497","https://openalex.org/W3042826782","https://openalex.org/W3177828909","https://openalex.org/W3190752170","https://openalex.org/W3207204660","https://openalex.org/W4285293017","https://openalex.org/W4303650187","https://openalex.org/W4310676769","https://openalex.org/W4313543542","https://openalex.org/W4367049415","https://openalex.org/W4378516410","https://openalex.org/W4391034692","https://openalex.org/W4396721167"],"related_works":[],"abstract_inverted_index":{"Molecular":[0],"structure":[1,76,150],"prediction":[2,127,165,253],"is":[3],"essential":[4],"for":[5,56,192],"understanding":[6],"therapeutic":[7],"functions":[8],"and":[9,48,84,136,209,226,229,285],"accelerating":[10],"pharmaceutical":[11],"research.":[12],"While":[13,172],"state-of-the-art":[14],"deep":[15],"learning":[16,144],"models":[17],"like":[18],"AlphaFold":[19,235],"demonstrate":[20,197,239,270],"strong":[21],"performance":[22,65,132],"on":[23,175,213,256],"general":[24],"protein":[25],"backbone":[26],"prediction,":[27],"they":[28],"struggle":[29],"with":[30,69,133,291],"critical":[31],"regions":[32,111],"of":[33,39,82,97,263],"VHH":[34,54,149,176,218],"antibodies,":[35,177],"a":[36,189,251],"novel":[37,57],"family":[38],"molecules":[40],"underrepresented":[41],"in":[42],"current":[43],"training":[44,276],"datasets.":[45],"Many":[46],"academic":[47],"industry":[49],"laboratories":[50],"can":[51,117],"generate":[52,164],"high-quality":[53],"structures":[55,105],"sequences,":[58],"presenting":[59],"an":[60,142],"opportunity":[61],"to":[62,80,152,163,238],"improve":[63,126,154],"model":[64,131,156,254,275],"through":[66,204,278],"iterative":[67,206],"fine-tuning":[68,207],"strategically":[70],"selected":[71],"new":[72],"data.":[73],"However,":[74],"experimental":[75],"determination":[77],"requires":[78],"weeks":[79],"months":[81],"effort":[83],"significant":[85],"costs":[86],"per":[87],"structure,":[88],"making":[89,184],"exhaustive":[90],"data":[91,115,170,290],"collection":[92,99],"impractical.":[93],"Randomly":[94],"curating":[95],"subset":[96],"full":[98],"yields":[100],"suboptimal":[101],"improvements,":[102],"as":[103,188,222],"many":[104,181],"provide":[106],"redundant":[107],"information":[108,293],"while":[109],"key":[110],"remain":[112],"unexplored.":[113],"Strategic":[114],"selection":[116,145,211],"identify":[118],"which":[119],"structures,":[120],"once":[121],"experimentally":[122],"determined,":[123],"will":[124],"maximally":[125,153],"accuracy,":[128],"enabling":[129],"superior":[130],"fewer":[134],"iterations":[135],"lower":[137],"costs.":[138],"We":[139,269],"propose":[140],"DEWDROP,":[141],"active":[143],"method":[146,191],"that":[147,167,260,271],"guides":[148],"curation":[151],"fine-tuned":[155],"performance.":[157],"DEWDROP":[158,185,272],"leverages":[159],"Monte":[160],"Carlo":[161],"dropout":[162],"ensembles":[166],"inform":[168],"optimal":[169],"selection.":[171],"we":[173,200,249],"focus":[174],"underrepresentation":[178],"issues":[179],"affect":[180],"molecular":[182,244,258],"domains,":[183],"broadly":[186],"applicable":[187],"model-agnostic":[190],"structural":[193,216],"biology":[194],"applications.":[195],"To":[196],"this":[198],"effectiveness,":[199],"evaluate":[201],"our":[202,223],"approach":[203],"retrospective":[205],"experiments":[208],"batch":[210,280],"analysis":[212],"two":[214],"distinct":[215],"families:":[217],"antibodies":[219],"from":[220,233],"SAbDab-nano":[221],"target":[224],"application":[225],"primary":[227],"benchmark":[228],"Mycobacterium":[230],"leprae":[231],"proteins":[232],"the":[234],"Protein":[236],"Database":[237],"broader":[240],"applicability":[241],"across":[242],"different":[243],"domains.":[245],"For":[246],"all":[247],"analyses,":[248],"use":[250],"structured":[252],"based":[255],"coarse-grain":[257],"representations":[259],"operates":[261],"independently":[262],"multiple":[264],"sequence":[265],"alignments":[266],"called":[267],"Equifold.":[268],"(1)":[273],"improves":[274],"efficiency":[277],"optimized":[279],"selection,":[281],"outperforming":[282],"baseline":[283],"methods":[284],"(2)":[286],"selects":[287],"structurally":[288],"informative":[289],"high":[292],"content.":[294]},"counts_by_year":[],"updated_date":"2026-05-21T09:19:25.381259","created_date":"2026-02-01T00:00:00"}
