{"id":"https://openalex.org/W7134978986","doi":"https://doi.org/10.48550/arxiv.2603.08921","title":"Vision-Language Models Encode Clinical Guidelines for Concept-Based Medical Reasoning","display_name":"Vision-Language Models Encode Clinical Guidelines for Concept-Based Medical Reasoning","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134978986","doi":"https://doi.org/10.48550/arxiv.2603.08921"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.08921","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.08921","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034889549","display_name":"Mohamed Harmanani","orcid":"https://orcid.org/0009-0002-4926-5221"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Harmanani, Mohamed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104245608","display_name":"Bining Long","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Long, Bining","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001905104","display_name":"Zhuoxin Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Zhuoxin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100637126","display_name":"Paul Wilson","orcid":"https://orcid.org/0009-0000-7299-8330"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wilson, Paul F. R.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093461277","display_name":"Amirhossein Sabour","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sabour, Amirhossein","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059649437","display_name":"Minh Nguyen Nhat To","orcid":"https://orcid.org/0000-0003-4035-3313"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"To, Minh Nguyen Nhat","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084753910","display_name":"G\u00e1bor Fichtinger","orcid":"https://orcid.org/0000-0002-6354-262X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fichtinger, Gabor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128714606","display_name":"Purang Abolmaesumi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abolmaesumi, Purang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125758589","display_name":"Parvin Mousavi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mousavi, Parvin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5034889549"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.34790000319480896,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.34790000319480896,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.31439998745918274,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.10239999741315842,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.833899974822998},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5485000014305115},{"id":"https://openalex.org/keywords/model-based-reasoning","display_name":"Model-based reasoning","score":0.4803999960422516},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4724000096321106},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.4122999906539917},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.38830000162124634},{"id":"https://openalex.org/keywords/expert-system","display_name":"Expert system","score":0.38119998574256897}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.833899974822998},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6679999828338623},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6553000211715698},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5485000014305115},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4862000048160553},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.4803999960422516},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4724000096321106},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.4122999906539917},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.38830000162124634},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.38119998574256897},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.36809998750686646},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.3465999960899353},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.3447999954223633},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33410000801086426},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.31130000948905945},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.2865999937057495},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.2791000008583069},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.08921","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.08921","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7562046647071838,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Concept":[0],"Bottleneck":[1],"Models":[2],"(CBMs)":[3],"are":[4,98],"a":[5,17,82,104,110],"prominent":[6],"framework":[7,85,178],"for":[8,22,54],"interpretable":[9],"AI":[10],"that":[11,39,86,141],"map":[12],"learned":[13],"visual":[14],"features":[15],"to":[16,35,122,190],"set":[18],"of":[19,161],"meaningful":[20],"concepts":[21,38],"task-specific":[23],"downstream":[24],"predictions.":[25],"Their":[26],"sequential":[27],"structure":[28],"enhances":[29,179],"transparency":[30,46],"by":[31],"connecting":[32],"model":[33,56,106,132],"predictions":[34,136],"the":[36,143],"underlying":[37],"support":[40],"them.":[41],"In":[42],"medical":[43,187],"imaging,":[44],"where":[45],"is":[47,107],"essential,":[48],"CBMs":[49],"offer":[50],"an":[51,183],"appealing":[52],"foundation":[53],"explainable":[55],"design.":[57],"However,":[58],"discrete":[59],"concept":[60,117],"representations":[61],"often":[62],"overlook":[63],"broader":[64],"clinical":[65,88,96,139],"context":[66],"such":[67],"as":[68],"diagnostic":[69,120,155],"guidelines":[70,89],"and":[71,92,103,119,128,156,165,181],"expert":[72,146],"heuristics,":[73],"reducing":[74],"reliability":[75],"in":[76],"complex":[77],"cases.":[78],"We":[79],"propose":[80],"MedCBR,":[81],"concept-based":[83,105],"reasoning":[84,93,131,147],"integrates":[87],"with":[90,109,159],"vision-language":[91],"models.":[94],"Labeled":[95],"descriptors":[97],"transformed":[99],"into":[100,137],"guideline-conformant":[101],"text,":[102],"trained":[108],"multitask":[111],"objective":[112],"combining":[113],"multimodal":[114],"contrastive":[115],"alignment,":[116],"supervision,":[118],"classification":[121],"jointly":[123],"ground":[124],"image":[125,188],"features,":[126],"concepts,":[127],"pathology.":[129],"A":[130],"then":[133],"converts":[134],"these":[135],"structured":[138],"narratives":[140],"explain":[142],"diagnosis,":[144],"emulating":[145],"based":[148],"on":[149,163,167,171],"established":[150],"guidelines.":[151],"MedCBR":[152],"achieves":[153],"superior":[154],"concept-level":[157],"performance,":[158],"AUROCs":[160],"94.2%":[162],"ultrasound":[164],"84.0%":[166],"mammography.":[168],"Further":[169],"experiments":[170],"non-medical":[172],"datasets":[173],"achieve":[174],"86.1%":[175],"accuracy.":[176],"Our":[177],"interpretability":[180],"forms":[182],"end-to-end":[184],"bridge":[185],"from":[186],"analysis":[189],"decision-making.":[191]},"counts_by_year":[],"updated_date":"2026-03-12T06:18:43.230356","created_date":"2026-03-12T00:00:00"}
