{"id":"https://openalex.org/W7160960829","doi":"https://doi.org/10.48550/arxiv.2605.10876","title":"AssayBench: An Assay-Level Virtual Cell Benchmark for LLMs and Agents","display_name":"AssayBench: An Assay-Level Virtual Cell Benchmark for LLMs and Agents","publication_year":2026,"publication_date":"2026-05-11","ids":{"openalex":"https://openalex.org/W7160960829","doi":"https://doi.org/10.48550/arxiv.2605.10876"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.10876","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10876","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.10876","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013970475","display_name":"Edward De Brouwer","orcid":"https://orcid.org/0000-0003-0608-0155"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"De Brouwer, Edward","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135988778","display_name":"Carl Edwards","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Edwards, Carl","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135935849","display_name":"Alexander Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135952226","display_name":"Jenna Collier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Collier, Jenna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135924134","display_name":"Graham Heimberg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heimberg, Graham","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135972679","display_name":"Xiner Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xiner","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090471536","display_name":"Meena Subramaniam","orcid":"https://orcid.org/0000-0003-1534-567X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Subramaniam, Meena","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057632577","display_name":"Ehsan Hajiramezanali","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hajiramezanali, Ehsan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135666240","display_name":"David Richmond","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Richmond, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029641905","display_name":"Jan-Christian H\u00fctter","orcid":"https://orcid.org/0000-0002-1219-4821"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"H\u00fctter, Jan-Christian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135969962","display_name":"Sara Mostafavi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mostafavi, Sara","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020099374","display_name":"Gabriele Scalia","orcid":"https://orcid.org/0000-0003-3305-9220"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scalia, Gabriele","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9232000112533569,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9232000112533569,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.02250000089406967,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.014700000174343586,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.8126000165939331},{"id":"https://openalex.org/keywords/testbed","display_name":"Testbed","score":0.5800999999046326},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5565999746322632},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.548799991607666},{"id":"https://openalex.org/keywords/in-silico","display_name":"In silico","score":0.524399995803833},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.48260000348091125}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.8126000165939331},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6657000184059143},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.5800999999046326},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5565999746322632},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.548799991607666},{"id":"https://openalex.org/C2775905019","wikidata":"https://www.wikidata.org/wiki/Q192572","display_name":"In silico","level":3,"score":0.524399995803833},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.48260000348091125},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47929999232292175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4212999939918518},{"id":"https://openalex.org/C103697762","wikidata":"https://www.wikidata.org/wiki/Q4112105","display_name":"Virtual screening","level":3,"score":0.39910000562667847},{"id":"https://openalex.org/C2780898871","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Performance metric","level":2,"score":0.38519999384880066},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.30169999599456787},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C98108389","wikidata":"https://www.wikidata.org/wiki/Q412563","display_name":"CRISPR","level":3,"score":0.26969999074935913},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.26109999418258667}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.10876","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10876","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.10876","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10876","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,44,48,58,218],"machine":[3],"learning":[4],"and":[5,78,153,181,188,197],"large-scale":[6],"biological":[7,28,60],"data":[8],"collections":[9],"have":[10],"revived":[11],"the":[12,32,40,53,104,141,155],"prospect":[13],"of":[14,22,31,36,55,136],"building":[15],"a":[16,19,50,119,146,158,211],"virtual":[17,225],"cell,":[18],"computational":[20],"model":[21,51],"cellular":[23,56,137],"behavior":[24],"that":[25,98,171],"could":[26],"accelerate":[27],"discovery.":[29],"One":[30],"most":[33],"compelling":[34],"promises":[35],"this":[37,88,114,206],"vision":[38],"is":[39],"ability":[41],"to":[42,76],"perform":[43],"silico":[45,219],"phenotypic":[46,70,105,122,220],"screens,":[47],"which":[49],"predicts":[52],"effects":[54],"perturbations":[57],"unseen":[59],"contexts.":[61],"This":[62],"task":[63,144],"combines":[64],"heterogeneous":[65,165],"textual":[66],"inputs":[67],"with":[68,103],"diverse":[69],"outputs,":[71],"making":[72],"it":[73],"particularly":[74],"well-suited":[75],"LLMs":[77,184,187],"agentic":[79],"systems.":[80],"Yet,":[81],"no":[82],"standard":[83],"benchmark":[84,120],"currently":[85],"exists":[86],"for":[87,121,150,161,214],"task,":[89],"as":[90,145,194],"existing":[91,172],"efforts":[92],"focus":[93],"on":[94,205],"narrower":[95],"molecular":[96],"readouts":[97],"are":[99],"only":[100],"indirectly":[101],"aligned":[102],"endpoints":[106],"driving":[107],"many":[108],"real-world":[109],"drug":[110],"discovery":[111],"workflows.":[112],"In":[113],"work,":[115],"we":[116],"present":[117],"AssayBench,":[118],"screen":[123,142,152],"prediction,":[124],"built":[125],"from":[126,176],"1,920":[127],"publicly":[128],"available":[129],"CRISPR":[130],"screens":[131],"spanning":[132],"five":[133],"broad":[134],"classes":[135],"phenotypes.":[138],"We":[139],"formulate":[140],"prediction":[143,149],"gene":[147],"rank":[148],"each":[151],"introduce":[154],"adjusted":[156],"nDCG,":[157],"continuous":[159],"metric":[160],"comparing":[162],"performance":[163,179,204],"across":[164],"assays.":[166],"Our":[167],"extensive":[168],"evaluation":[169],"shows":[170],"methods":[173],"remain":[174],"far":[175],"empirically":[177],"estimated":[178],"ceilings":[180],"zero-shot":[182],"generalist":[183],"outperform":[185],"biology-specific":[186],"trainable":[189],"baselines.":[190],"Optimization":[191],"techniques":[192],"such":[193],"fine-tuning,":[195],"ensembling,":[196],"prompt":[198],"optimization":[199],"can":[200],"further":[201],"improve":[202],"LLM":[203],"task.":[207],"Overall,":[208],"AssayBench":[209],"offers":[210],"practical":[212],"testbed":[213],"measuring":[215],"progress":[216],"toward":[217],"screening":[221],"and,":[222],"more":[223],"broadly,":[224],"cell":[226],"models.":[227]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
