{"id":"https://openalex.org/W7140992041","doi":"https://doi.org/10.48550/arxiv.2603.25240","title":"Lingshu-Cell: A generative cellular world model for transcriptome modeling toward virtual cells","display_name":"Lingshu-Cell: A generative cellular world model for transcriptome modeling toward virtual cells","publication_year":2026,"publication_date":"2026-03-26","ids":{"openalex":"https://openalex.org/W7140992041","doi":"https://doi.org/10.48550/arxiv.2603.25240"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.25240","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25240","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.25240","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130765742","display_name":"Han Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Han","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068977715","display_name":"Guo-Hua Yuan","orcid":"https://orcid.org/0000-0002-8459-3784"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Guo-Hua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101345686","display_name":"Chaohao Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Chaohao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005345630","display_name":"Tingyang Xu","orcid":"https://orcid.org/0000-0002-8487-9045"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Tingyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130798813","display_name":"Tian Bian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bian, Tian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130747461","display_name":"Hong Sheng Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Hong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130785817","display_name":"Wenbing Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wenbing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130745796","display_name":"Deli Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Deli","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5104347463","display_name":"Yu Rong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rong, Yu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5130765742"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.006000000052154064,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10621","display_name":"Gene Regulatory Network Analysis","score":0.0052999998442828655,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transcriptome","display_name":"Transcriptome","score":0.560699999332428},{"id":"https://openalex.org/keywords/in-silico","display_name":"In silico","score":0.5605000257492065},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4027000069618225},{"id":"https://openalex.org/keywords/systems-biology","display_name":"Systems biology","score":0.3991999924182892},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.396699994802475},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.3928000032901764},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.3725000023841858}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5651999711990356},{"id":"https://openalex.org/C162317418","wikidata":"https://www.wikidata.org/wiki/Q252857","display_name":"Transcriptome","level":4,"score":0.560699999332428},{"id":"https://openalex.org/C2775905019","wikidata":"https://www.wikidata.org/wiki/Q192572","display_name":"In silico","level":3,"score":0.5605000257492065},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5001999735832214},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4408999979496002},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4027000069618225},{"id":"https://openalex.org/C152662350","wikidata":"https://www.wikidata.org/wiki/Q815297","display_name":"Systems biology","level":2,"score":0.3991999924182892},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.396699994802475},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.3928000032901764},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38760000467300415},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.314300000667572},{"id":"https://openalex.org/C137866125","wikidata":"https://www.wikidata.org/wiki/Q4299308","display_name":"Modelling biological systems","level":3,"score":0.2969000041484833},{"id":"https://openalex.org/C18431079","wikidata":"https://www.wikidata.org/wiki/Q1502169","display_name":"Gene expression profiling","level":4,"score":0.28769999742507935},{"id":"https://openalex.org/C165864922","wikidata":"https://www.wikidata.org/wiki/Q411391","display_name":"Regulation of gene expression","level":3,"score":0.26829999685287476},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C177918212","wikidata":"https://www.wikidata.org/wiki/Q803623","display_name":"Perturbation (astronomy)","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C153646914","wikidata":"https://www.wikidata.org/wiki/Q535695","display_name":"Cellular network","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.25240","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25240","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.25240","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25240","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modeling":[0],"cellular":[1,40,134,189],"states":[2,41,198],"and":[3,15,59,115,125,158,173,199,212],"predicting":[4,175],"their":[5],"responses":[6,177],"to":[7,131],"perturbations":[8],"are":[9],"central":[10],"challenges":[11],"in":[12,68,174,178,193,209],"computational":[13],"biology":[14],"the":[16,37,77,165,203],"development":[17],"of":[18,39,81,156,196],"virtual":[19],"cells.":[20],"Existing":[21],"foundation":[22,204],"models":[23],"for":[24,42,153,192,205],"single-cell":[25,82],"transcriptomics":[26],"provide":[27],"powerful":[28],"static":[29],"representations,":[30],"but":[31],"they":[32],"do":[33],"not":[34],"explicitly":[35],"model":[36,53,191],"distribution":[38],"generative":[43],"simulation.":[44],"Here,":[45],"we":[46],"introduce":[47],"Lingshu-Cell,":[48],"a":[49,69,187,206],"masked":[50],"discrete":[51,70],"diffusion":[52],"that":[54,73],"learns":[55],"transcriptomic":[56,83,120],"state":[57],"distributions":[58],"supports":[60],"conditional":[61],"simulation":[62,195],"under":[63],"perturbation.":[64,159],"By":[65],"operating":[66],"directly":[67],"token":[71],"space":[72],"is":[74],"compatible":[75],"with":[76,145],"sparse,":[78],"non-sequential":[79],"nature":[80],"data,":[84],"Lingshu-Cell":[85,117,147,185],"captures":[86],"complex":[87,133],"transcriptome-wide":[88],"expression":[89,110,123,151],"dependencies":[90],"across":[91],"approximately":[92],"18,000":[93],"genes":[94],"without":[95],"relying":[96],"on":[97,164],"prior":[98],"gene":[99],"selection,":[100],"such":[101],"as":[102,186],"filtering":[103],"by":[104,109,137],"high":[105],"variability":[106],"or":[107,142],"ranking":[108],"level.":[111],"Across":[112],"diverse":[113],"tissues":[114],"species,":[116],"accurately":[118],"reproduces":[119],"distributions,":[121],"marker-gene":[122],"patterns":[124],"cell-subtype":[126],"proportions,":[127],"demonstrating":[128],"its":[129],"ability":[130],"capture":[132],"heterogeneity.":[135],"Moreover,":[136],"jointly":[138],"embedding":[139],"cell":[140,197],"type":[141],"donor":[143],"identity":[144,157],"perturbation,":[146],"can":[148],"predict":[149],"whole-transcriptome":[150],"changes":[152],"novel":[154],"combinations":[155],"It":[160],"achieves":[161],"leading":[162],"performance":[163],"Virtual":[166],"Cell":[167],"Challenge":[168],"H1":[169],"genetic":[170],"perturbation":[171,200,213],"benchmark":[172],"cytokine-induced":[176],"human":[179],"PBMCs.":[180],"Together,":[181],"these":[182],"results":[183],"establish":[184],"flexible":[188],"world":[190],"silico":[194],"responses,":[201],"laying":[202],"new":[207],"paradigm":[208],"biological":[210],"discovery":[211],"screening.":[214]},"counts_by_year":[],"updated_date":"2026-03-28T06:16:51.555046","created_date":"2026-03-28T00:00:00"}
