{"id":"https://openalex.org/W4407178999","doi":"https://doi.org/10.48550/arxiv.2502.01535","title":"VisTA: Vision-Text Alignment Model with Contrastive Learning using Multimodal Data for Evidence-Driven, Reliable, and Explainable Alzheimer's Disease Diagnosis","display_name":"VisTA: Vision-Text Alignment Model with Contrastive Learning using Multimodal Data for Evidence-Driven, Reliable, and Explainable Alzheimer's Disease Diagnosis","publication_year":2025,"publication_date":"2025-02-03","ids":{"openalex":"https://openalex.org/W4407178999","doi":"https://doi.org/10.48550/arxiv.2502.01535"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2502.01535","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.01535","pdf_url":"https://arxiv.org/pdf/2502.01535","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2502.01535","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086574827","display_name":"Duy-Cat Can","orcid":"https://orcid.org/0000-0002-6861-2893"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Can, Duy-Cat","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109242674","display_name":"Linh D. Dang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dang, Linh D.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001447018","display_name":"Quang-Huy Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Quang-Huy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116164082","display_name":"Dang Minh Ly","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ly, Dang Minh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109297653","display_name":"Huang Ha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ha, Huong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117619760","display_name":"Guillaume Blanc","orcid":"https://orcid.org/0000-0003-4109-726X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Blanc, Guillaume","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074236126","display_name":"Oliver Y. Ch\u00e9n","orcid":"https://orcid.org/0000-0002-5696-3127"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ch\u00e9n, Oliver Y.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100387323","display_name":"Thanh Binh Nguyen","orcid":"https://orcid.org/0000-0002-2260-8186"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Binh T.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5086574827"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9695000052452087,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9695000052452087,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.921500027179718,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/disease","display_name":"Disease","score":0.4804248809814453},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47994354367256165},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4636930227279663},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4055213928222656},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.36615294218063354},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3289756178855896},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.17616847157478333},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.12154319882392883},{"id":"https://openalex.org/keywords/pathology","display_name":"Pathology","score":0.04718828201293945}],"concepts":[{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.4804248809814453},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47994354367256165},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4636930227279663},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4055213928222656},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.36615294218063354},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3289756178855896},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.17616847157478333},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.12154319882392883},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.04718828201293945}],"mesh":[],"locations_count":4,"locations":[{"id":"pmh:oai:arXiv.org:2502.01535","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.01535","pdf_url":"https://arxiv.org/pdf/2502.01535","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:serval.unil.ch:BIB_44488410E4A1","is_oa":true,"landing_page_url":"https://serval.unil.ch/notice/serval:BIB_44488410E4A1","pdf_url":"https://iris.unil.ch/bitstreams/f7368346-cd9a-423d-9ec5-6fbb5a103477/download","source":{"id":"https://openalex.org/S4306401797","display_name":"SERVAL (Universit\u00e9 de Lausanne)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210093590","host_organization_name":"Swiss School of Archaeology in Greece","host_organization_lineage":["https://openalex.org/I4210093590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/submittedVersion"},{"id":"pmh:oai:iris.unil.ch:iris/266810","is_oa":true,"landing_page_url":"https://iris.unil.ch/handle/iris/266810","pdf_url":null,"source":{"id":"https://openalex.org/S7407055444","display_name":"IRIS","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"other"},{"id":"doi:10.48550/arxiv.2502.01535","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2502.01535","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2502.01535","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.01535","pdf_url":"https://arxiv.org/pdf/2502.01535","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407178999.pdf","grobid_xml":"https://content.openalex.org/works/W4407178999.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2931662336","https://openalex.org/W2077865380","https://openalex.org/W3006817050","https://openalex.org/W4401768695","https://openalex.org/W2765597752","https://openalex.org/W2134894512","https://openalex.org/W2083375246","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Objective:":[0],"Assessing":[1],"Alzheimer's":[2],"disease":[3,48],"(AD)":[4],"using":[5,76],"high-dimensional":[6],"radiology":[7],"images":[8,81,155],"is":[9],"clinically":[10],"important":[11],"but":[12],"challenging.":[13],"Although":[14],"Artificial":[15],"Intelligence":[16],"(AI)":[17],"has":[18],"advanced":[19],"AD":[20,65,122],"diagnosis,":[21],"it":[22,75],"remains":[23],"unclear":[24],"how":[25],"to":[26,46,79,115,152],"design":[27],"AI":[28],"models":[29],"embracing":[30],"predictability":[31],"and":[32,50,73,85,101,120,135,167,174,184,190,203,209,223,237],"explainability.":[33],"Here,":[34],"we":[35,68,91,128,142],"propose":[36],"VisTA,":[37,90],"a":[38,93],"multimodal":[39],"language-vision":[40],"model":[41],"assisted":[42],"by":[43,104],"contrastive":[44,77],"learning,":[45],"optimize":[47,233],"prediction":[49],"evidence-based,":[51],"interpretable":[52],"explanations":[53,145,217],"for":[54,64,132,157,165],"clinical":[55,235],"decision-making.":[56],"Methods:":[57],"We":[58],"developed":[59],"VisTA":[60,70,107,160,180,199,232],"(Vision-Text":[61],"Alignment":[62],"Model)":[63],"diagnosis.":[66],"Architecturally,":[67],"built":[69],"from":[71,193,212],"BiomedCLIP":[72],"fine-tuned":[74],"learning":[78],"align":[80],"with":[82,146,220],"verified":[83,103],"abnormalities":[84],"their":[86],"descriptions.":[87],"To":[88,124,138],"train":[89],"used":[92,156,162],"constructed":[94],"reference":[95,116],"dataset":[96],"containing":[97],"images,":[98],"abnormality":[99,112,133,172,178],"types,":[100],"descriptions":[102],"medical":[105],"experts.":[106],"produces":[108],"four":[109],"outputs:":[110],"predicted":[111],"type,":[113],"similarity":[114],"cases,":[117],"evidence-driven":[118],"explanation,":[119],"final":[121],"diagnoses.":[123],"illustrate":[125],"VisTA's":[126,140],"efficacy,":[127],"reported":[129],"accuracy":[130,183,202],"metrics":[131],"retrieval":[134,173],"dementia":[136,175,197],"prediction.":[137,176],"demonstrate":[139],"explainability,":[141],"compared":[143],"its":[144],"human":[147,221],"experts'":[148,222],"explanations.":[149],"Results:":[150],"Compared":[151],"15":[153],"million":[154],"baseline":[158,194,213],"pretraining,":[159],"only":[161],"170":[163],"samples":[164],"fine-tuning":[166],"obtained":[168],"significant":[169],"improvement":[170],"in":[171],"For":[177,196],"retrieval,":[179],"reached":[181],"74%":[182],"an":[185,204],"AUC":[186,205],"of":[187,206],"0.87":[188],"(26%":[189],"0.74,":[191],"respectively,":[192,211],"models).":[195,214],"prediction,":[198,234],"achieved":[200],"88%":[201],"0.82":[207],"(30%":[208],"0.57,":[210],"The":[215],"generated":[216],"agreed":[218],"strongly":[219],"provided":[224],"insights":[225],"into":[226],"the":[227],"diagnostic":[228],"process.":[229],"Taken":[230],"together,":[231],"reasoning,":[236],"explanation.":[238]},"counts_by_year":[],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2025-10-10T00:00:00"}
