{"id":"https://openalex.org/W7151235018","doi":"https://doi.org/10.48550/arxiv.2604.03635","title":"A Generative Foundation Model for Multimodal Histopathology","display_name":"A Generative Foundation Model for Multimodal Histopathology","publication_year":2026,"publication_date":"2026-04-04","ids":{"openalex":"https://openalex.org/W7151235018","doi":"https://doi.org/10.48550/arxiv.2604.03635"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03635","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03635","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03635","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055991162","display_name":"Jinxi Xiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xiang, Jinxi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133139263","display_name":"Mingjie Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Mingjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033870400","display_name":"Siyu Hou","orcid":"https://orcid.org/0000-0002-5300-6495"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hou, Siyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133093763","display_name":"Yijiang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yijiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133071765","display_name":"Xiangde Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Xiangde","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034586348","display_name":"Yuanfeng Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji, Yuanfeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133143213","display_name":"Xiang Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Xiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133139768","display_name":"Ehsan Adeli","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Adeli, Ehsan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133146403","display_name":"Akshay Chaudhari","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chaudhari, Akshay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133120846","display_name":"Curtis P. Langlotz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Langlotz, Curtis P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055107125","display_name":"Kilian M. Pohl","orcid":"https://orcid.org/0000-0001-5416-5159"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pohl, Kilian M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121965092","display_name":"Ruijiang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Ruijiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5055991162"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.9370999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.9370999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.016200000420212746,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0066999997943639755,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.6434000134468079},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.5066999793052673},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.48429998755455017},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.4569999873638153},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.3781999945640564},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3637999892234802},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.31520000100135803}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6628000140190125},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.6434000134468079},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6277999877929688},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5397999882698059},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.5066999793052673},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.48429998755455017},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.4569999873638153},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3781999945640564},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3637999892234802},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35359999537467957},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.31520000100135803},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C2777522853","wikidata":"https://www.wikidata.org/wiki/Q5276128","display_name":"Digital pathology","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2581999897956848},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03635","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03635","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03635","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03635","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"diagnosis":[1],"and":[2,11,28,70,77,104,127,148,193],"treatment":[3],"of":[4],"complex":[5],"diseases":[6],"require":[7],"integrating":[8],"histological,":[9],"molecular,":[10],"clinical":[12,78],"data,":[13],"yet":[14],"in":[15],"practice":[16],"these":[17],"modalities":[18,38,218],"are":[19],"often":[20],"incomplete":[21],"owing":[22],"to":[23,35,145,155,191],"tissue":[24,134],"scarcity,":[25],"assay":[26],"cost,":[27],"workflow":[29],"constraints.":[30],"Existing":[31],"computational":[32,227],"approaches":[33],"attempt":[34],"impute":[36],"missing":[37],"from":[39],"available":[40],"data":[41,159],"but":[42],"rely":[43],"on":[44,48,94],"task-specific":[45,123],"models":[46,147],"trained":[47],"narrow,":[49],"single":[50],"source-target":[51],"pairs,":[52,103],"limiting":[53],"their":[54],"generalizability.":[55],"Here":[56],"we":[57],"introduce":[58],"MuPD":[59,113,130,165,187],"(Multimodal":[60],"Pathology":[61],"Diffusion),":[62],"a":[63,81,86,184,209,225],"generative":[64,212],"foundation":[65],"model":[66,213],"that":[67,208],"embeds":[68],"hematoxylin":[69],"eosin":[71],"(H&amp;E)-stained":[72],"histology,":[73],"molecular":[74],"RNA":[75],"profiles,":[76],"text":[79],"into":[80],"shared":[82],"latent":[83],"space":[84],"through":[85,157],"diffusion":[87],"transformer":[88],"with":[89,119,171],"decoupled":[90],"cross-modal":[91,116],"attention.":[92],"Pretrained":[93],"100":[95],"million":[96,101,106],"histology":[97,163],"image":[98],"patches,":[99],"1.6":[100],"text-histology":[102],"10.8":[105],"RNA-histology":[107],"pairs":[108],"spanning":[109],"34":[110],"human":[111],"organs,":[112],"supports":[114],"diverse":[115],"synthesis":[117],"tasks":[118],"minimal":[120],"or":[121],"no":[122],"fine-tuning.":[124],"For":[125,161],"text-conditioned":[126],"image-to-image":[128],"generation,":[129,164],"synthesizes":[131],"histologically":[132],"faithful":[133],"architectures,":[135],"reducing":[136],"Fr\u00e9chet":[137],"inception":[138],"distance":[139],"(FID)":[140],"scores":[141],"by":[142,153,168,200],"50%":[143],"relative":[144],"domain-specific":[146],"improving":[149,196],"few-shot":[150],"classification":[151],"accuracy":[152],"up":[154],"47%":[156],"synthetic":[158],"augmentation.":[160],"RNA-conditioned":[162],"reduces":[166],"FID":[167],"23%":[169],"compared":[170],"the":[172],"next-best":[173],"method":[174],"while":[175],"preserving":[176],"cell-type":[177],"distributions":[178],"across":[179,215],"five":[180],"cancer":[181],"types.":[182],"As":[183],"virtual":[185],"stainer,":[186],"translates":[188],"H&amp;E":[189],"images":[190],"immunohistochemistry":[192],"multiplex":[194],"immunofluorescence,":[195],"average":[197],"marker":[198],"correlation":[199],"37%":[201],"over":[202],"existing":[203],"approaches.":[204],"These":[205],"results":[206],"demonstrate":[207],"single,":[210],"unified":[211],"pretrained":[214],"heterogeneous":[216],"pathology":[217],"can":[219],"substantially":[220],"outperform":[221],"specialized":[222],"alternatives,":[223],"providing":[224],"scalable":[226],"framework":[228],"for":[229],"multimodal":[230],"histopathology.":[231]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-08T00:00:00"}
