{"id":"https://openalex.org/W7138975949","doi":"https://doi.org/10.48550/arxiv.2603.17380","title":"SCALE:Scalable Conditional Atlas-Level Endpoint transport for virtual cell perturbation prediction","display_name":"SCALE:Scalable Conditional Atlas-Level Endpoint transport for virtual cell perturbation prediction","publication_year":2026,"publication_date":"2026-03-18","ids":{"openalex":"https://openalex.org/W7138975949","doi":"https://doi.org/10.48550/arxiv.2603.17380"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.17380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.17380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.17380","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129757221","display_name":"Shuizhou Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Shuizhou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063286602","display_name":"Lang Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Lang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129875517","display_name":"Kedu Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Kedu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129914580","display_name":"Songming Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Songming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129861331","display_name":"Hao Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130129041","display_name":"Wenxuan Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wenxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130212149","display_name":"Sheng Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Sheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130083575","display_name":"Quan Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Quan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129849981","display_name":"Qin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Qin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102884884","display_name":"Lei Bai","orcid":"https://orcid.org/0000-0001-9960-4098"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129931175","display_name":"Siqi Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Siqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5060075172","display_name":"Zhangyang Gao","orcid":"https://orcid.org/0000-0003-1026-6083"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Zhangyang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5129757221"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.41940000653266907,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.41940000653266907,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.39340001344680786,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10621","display_name":"Gene Regulatory Network Analysis","score":0.034699998795986176,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7281000018119812},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6366000175476074},{"id":"https://openalex.org/keywords/perturbation","display_name":"Perturbation (astronomy)","score":0.5475000143051147},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.4113999903202057},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.2985999882221222},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.29820001125335693},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.296099990606308},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.2865000069141388}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7281000018119812},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6700999736785889},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6366000175476074},{"id":"https://openalex.org/C177918212","wikidata":"https://www.wikidata.org/wiki/Q803623","display_name":"Perturbation (astronomy)","level":2,"score":0.5475000143051147},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.4113999903202057},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38589999079704285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38100001215934753},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33469998836517334},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.31040000915527344},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2985999882221222},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.296099990606308},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2865000069141388},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2849000096321106},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.28189998865127563},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.2678999900817871},{"id":"https://openalex.org/C2986056383","wikidata":"https://www.wikidata.org/wiki/Q556030","display_name":"Power flow","level":4,"score":0.2648000121116638},{"id":"https://openalex.org/C103697762","wikidata":"https://www.wikidata.org/wiki/Q4112105","display_name":"Virtual screening","level":3,"score":0.262800008058548},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.25609999895095825},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.25380000472068787},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.17380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.17380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.17380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.17380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.6350771188735962,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Virtual":[0],"cell":[1,71],"models":[2],"aim":[3],"to":[4,14],"enable":[5],"in":[6,42],"silico":[7],"experimentation":[8],"by":[9,31,181,186],"predicting":[10],"how":[11],"cells":[12,197],"respond":[13],"genetic,":[15],"chemical,":[16],"or":[17],"cytokine":[18],"perturbations":[19],"from":[20],"single-cell":[21],"measurements.":[22],"In":[23,58],"practice,":[24],"however,":[25],"large-scale":[26,65],"perturbation":[27,72,120,151],"prediction":[28,73,121],"remains":[29],"constrained":[30],"three":[32],"coupled":[33],"bottlenecks:":[34],"inefficient":[35],"training":[36,85,146],"and":[37,47,86,96,104,125,147,183,214],"inference":[38,87,107],"pipelines,":[39],"unstable":[40],"modeling":[41],"high-dimensional":[43],"sparse":[44],"expression":[45],"space,":[46],"evaluation":[48],"protocols":[49],"that":[50,74,89,133,194],"overemphasize":[51],"reconstruction-like":[52],"accuracy":[53],"while":[54],"underestimating":[55],"biological":[56],"fidelity.":[57],"this":[59,175],"work":[60],"we":[61,81,118,154],"present":[62],"a":[63,83,129,161],"specialized":[64],"foundation":[66],"model":[67,157,178],"SCALE":[68],"for":[69],"virtual":[70,196],"addresses":[75],"the":[76,109,156,206],"above":[77],"limitations":[78],"jointly.":[79],"First,":[80],"build":[82],"BioNeMo-based":[84],"framework":[88],"substantially":[90],"improves":[91,179],"data":[92],"throughput,":[93],"distributed":[94],"scalability,":[95],"deployment":[97],"efficiency,":[98],"yielding":[99],"12.51*":[100],"speedup":[101],"on":[102,106,158,166],"pretrain":[103],"1.29*":[105],"over":[108,188],"prior":[110],"SOTA":[111],"pipeline":[112],"under":[113],"matched":[114],"system":[115],"settings.":[116],"Second,":[117],"formulate":[119],"as":[122],"conditional":[123],"transport":[124,212],"implement":[126],"it":[127],"with":[128,138],"set-aware":[130],"flow":[131],"architecture":[132],"couples":[134],"LLaMA-based":[135],"cellular":[136],"encoding":[137],"endpoint-oriented":[139],"supervision.":[140],"This":[141],"design":[142],"yields":[143],"more":[144],"stable":[145,211],"stronger":[148],"recovery":[149],"of":[150,208],"effects.":[152],"Third,":[153],"evaluate":[155],"Tahoe-100M":[159],"using":[160],"rigorous":[162],"cell-level":[163],"protocol":[164],"centered":[165],"biologically":[167,215],"meaningful":[168],"metrics":[169],"rather":[170],"than":[171],"reconstruction":[172],"alone.":[173],"On":[174],"benchmark,":[176],"our":[177],"PDCorr":[180],"12.02%":[182],"DE":[184],"Overlap":[185],"10.66%":[187],"STATE.":[189],"Together,":[190],"these":[191],"results":[192],"suggest":[193],"advancing":[195],"requires":[198],"not":[199],"only":[200],"better":[201],"generative":[202],"objectives,":[203],"but":[204],"also":[205],"co-design":[207],"scalable":[209],"infrastructure,":[210],"modeling,":[213],"faithful":[216],"evaluation.":[217]},"counts_by_year":[],"updated_date":"2026-03-20T20:54:20.808490","created_date":"2026-03-20T00:00:00"}
