{"id":"https://openalex.org/W7140093486","doi":"https://doi.org/10.18653/v1/2026.eacl-long.197","title":"Enhancing the Safety of Medical Vision-Language Models by Synthetic Demonstrations","display_name":"Enhancing the Safety of Medical Vision-Language Models by Synthetic Demonstrations","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7140093486","doi":"https://doi.org/10.18653/v1/2026.eacl-long.197"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2026.eacl-long.197","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.eacl-long.197","pdf_url":"https://aclanthology.org/2026.eacl-long.197.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2026.eacl-long.197.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040852802","display_name":"Zhiyu Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhiyu Xue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130382938","display_name":"Reza Abbasi-Asl","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reza Abbasi-Asl","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130395512","display_name":"Ramtin Pedarsani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramtin Pedarsani","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38451263,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4207","last_page":"4220"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.35670000314712524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.35670000314712524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.2745000123977661,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.04740000143647194,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.24740000069141388},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.24629999697208405},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.23890000581741333},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.23720000684261322},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.23409999907016754}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48570001125335693},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3052000105381012},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2896000146865845},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.28459998965263367},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.24740000069141388},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.24629999697208405},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.23890000581741333},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.23720000684261322},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.23409999907016754},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.22059999406337738}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2026.eacl-long.197","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.eacl-long.197","pdf_url":"https://aclanthology.org/2026.eacl-long.197.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2026.eacl-long.197","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.eacl-long.197","pdf_url":"https://aclanthology.org/2026.eacl-long.197.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7140093486.pdf","grobid_xml":"https://content.openalex.org/works/W7140093486.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generative":[0],"medical":[1,23,103],"vision-language":[2],"models":[3],"(Med-VLMs)":[4],"are":[5],"primarily":[6],"designed":[7],"to":[8,76,90],"generate":[9],"complex":[10],"textual":[11,99],"information":[12],"(e.g.,":[13,22,28],"diagnostic":[14],"reports)":[15],"from":[16,107],"multimodal":[17],"inputs":[18],"including":[19],"vision":[20],"modality":[21,27],"images)":[24],"and":[25,98,152],"language":[26],"clinical":[29,79,119],"queries).However,":[30],"their":[31],"security":[32,60,151],"vulnerabilities":[33],"remain":[34],"underexplored.Med-VLMs":[35],"should":[36],"be":[37],"capable":[38],"of":[39,65],"rejecting":[40],"harmful":[41,92],"queries,":[42,93],"such":[43],"as":[44,145],"Provide":[45],"detailed":[46],"instructions":[47],"for":[48,53,149],"using":[49],"this":[50,81],"CT":[51],"scan":[52],"insurance":[54],"fraud.At":[55],"the":[56,63,132,136],"same":[57],"time,":[58],"addressing":[59],"concerns":[61],"introduces":[62],"risk":[64],"over-defense,":[66],"where":[67],"safetyenhancing":[68],"mechanisms":[69],"may":[70],"degrade":[71],"general":[72],"performance,":[73],"causing":[74],"Med-VLMs":[75],"reject":[77],"benign":[78],"queries.In":[80],"paper,":[82],"we":[83,110,128],"propose":[84],"a":[85,141,146],"novel":[86],"inference-time":[87],"defense":[88,95,114],"strategy":[89,115,144],"mitigate":[91],"enabling":[94],"against":[96],"visual":[97],"jailbreak":[100],"attacks.Using":[101],"diverse":[102],"imaging":[104],"datasets":[105],"collected":[106],"nine":[108],"modalities,":[109],"demonstrate":[111],"that":[112,130],"our":[113],"based":[116],"on":[117],"synthetic":[118],"demonstrations":[120],"enhances":[121],"model":[122],"safety":[123],"without":[124],"significantly":[125],"compromising":[126],"performance.Additionally,":[127],"find":[129],"increasing":[131],"demonstration":[133,143,156],"budget":[134,157],"alleviates":[135],"overdefense":[137],"issue.We":[138],"then":[139],"introduce":[140],"mixed":[142],"trade-off":[147],"solution":[148],"balancing":[150],"performance":[153],"under":[154],"few-shot":[155],"constraints":[158],"1":[159],".":[160]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-24T00:00:00"}
