{"id":"https://openalex.org/W7160643234","doi":"https://doi.org/10.48550/arxiv.2605.05810","title":"CXR-ContraBench: Benchmarking Negated-Option Attraction in Medical VLMs","display_name":"CXR-ContraBench: Benchmarking Negated-Option Attraction in Medical VLMs","publication_year":2026,"publication_date":"2026-05-07","ids":{"openalex":"https://openalex.org/W7160643234","doi":"https://doi.org/10.48550/arxiv.2605.05810"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.05810","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05810","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.05810","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135720814","display_name":"Zhengru Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Zhengru","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135726509","display_name":"Yanan Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Yanan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135661702","display_name":"Yu Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135702608","display_name":"Senkang Forest Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Senkang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135706505","display_name":"Yixian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yixian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013699453","display_name":"Hangcheng Cao","orcid":"https://orcid.org/0000-0002-0957-8576"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Hangcheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135639826","display_name":"Wenbo Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Wenbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5016290340","display_name":"Yuguang Fang","orcid":"https://orcid.org/0000-0002-1079-3871"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Yuguang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.5532000064849854,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.5532000064849854,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.08449999988079071,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.04580000042915344,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7538999915122986},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7078999876976013},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5738999843597412},{"id":"https://openalex.org/keywords/statement","display_name":"Statement (logic)","score":0.41029998660087585},{"id":"https://openalex.org/keywords/byte","display_name":"Byte","score":0.3531000018119812},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.349700003862381},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.3495999872684479}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7538999915122986},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7078999876976013},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.605400025844574},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5738999843597412},{"id":"https://openalex.org/C2777026412","wikidata":"https://www.wikidata.org/wiki/Q2684591","display_name":"Statement (logic)","level":2,"score":0.41029998660087585},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3637999892234802},{"id":"https://openalex.org/C43364308","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Byte","level":2,"score":0.3531000018119812},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.349700003862381},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.3495999872684479},{"id":"https://openalex.org/C2776728590","wikidata":"https://www.wikidata.org/wiki/Q363948","display_name":"Contradiction","level":2,"score":0.34549999237060547},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33959999680519104},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32739999890327454},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.3190000057220459},{"id":"https://openalex.org/C2777361361","wikidata":"https://www.wikidata.org/wiki/Q1112585","display_name":"Polarity (international relations)","level":3,"score":0.3165999948978424},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3077999949455261},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.296099990606308},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C12590798","wikidata":"https://www.wikidata.org/wiki/Q3933199","display_name":"Replication (statistics)","level":2,"score":0.2856999933719635},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2619999945163727},{"id":"https://openalex.org/C2779974597","wikidata":"https://www.wikidata.org/wiki/Q28448986","display_name":"Clinical Practice","level":2,"score":0.25619998574256897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.05810","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05810","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.05810","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.05810","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.5123509764671326,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"When":[0],"a":[1,14,31,36,50,55,78,132,148,218],"chest":[2],"X-ray":[3],"shows":[4],"consolidation":[5],"but":[6,171],"the":[7,40,65,69,105,125,190,206],"question":[8],"asks":[9],"which":[10],"finding":[11],"is":[12,23,30,52,127],"present,":[13],"medical":[15],"vision-language":[16],"model":[17,51],"may":[18],"answer":[19,57],"\"No":[20,99],"consolidation.\"":[21],"This":[22],"more":[24],"than":[25],"an":[26],"incorrect":[27],"choice:":[28],"it":[29,61],"polarity":[32,222],"reversal":[33],"that":[34,213],"emits":[35],"clinical":[37,107],"statement":[38],"contradicting":[39],"image.":[41],"We":[42,71],"study":[43],"this":[44],"failure":[45,126],"as":[46,113],"negated-option":[47],"attraction,":[48],"where":[49,97],"drawn":[53],"to":[54,200],"negated":[56,120,157],"option":[58],"even":[59],"when":[60],"conflicts":[62],"with":[63],"both":[64,154],"visual":[66],"evidence":[67],"and":[68,85,88,109,129,138,143,176,198,202,226],"question.":[70],"introduce":[72],"CXR-ContraBench":[73],"(Chest":[74],"X-Ray":[75],"Contradiction":[76],"Benchmark),":[77],"diagnostic":[79],"benchmark":[80,92,227],"spanning":[81],"internal":[82],"ReXVQA":[83],"slices":[84],"external":[86],"OpenI":[87],"CheXpert":[89,123,151],"protocols.":[90],"The":[91],"centers":[93],"on":[94,147,159,205],"present-finding":[95],"questions,":[96],"selecting":[98],"X\"":[100],"despite":[101],"visible":[102],"X":[103],"creates":[104],"main":[106],"risk,":[108],"uses":[110],"absent-finding":[111],"questions":[112],"secondary":[114],"tests":[115],"of":[116,162],"whether":[117],"models":[118,155],"copy":[119],"wording.":[121],"Across":[122],"protocols,":[124],"substantial":[128],"persistent.":[130],"On":[131],"strict":[133],"direct":[134,207],"presence":[135,163,208],"probe,":[136],"MedGemma":[137,197],"Qwen2.5-VL":[139,199],"reach":[140],"only":[141],"31.49%":[142],"30.21%":[144],"accuracy,":[145],"respectively;":[146],"matched":[149],"135,754-record":[150],"training-split":[152],"protocol,":[153],"select":[156],"options":[158],"over":[160],"62%":[161],"questions.":[164],"Chain-of-thought":[165],"prompting":[166],"reduces":[167],"some":[168],"presence-side":[169],"reversals":[170],"does":[172],"not":[173],"eliminate":[174],"them":[175],"can":[177,216],"amplify":[178],"absence-side":[179],"contradictions.":[180],"Finally,":[181],"QCCV-Neg":[182],"(Question-Conditioned":[183],"Consistency":[184],"Verifier":[185],"for":[186],"Negation)":[187],"deterministically":[188],"repairs":[189],"measured":[191],"polarity-confused":[192],"subset":[193],"without":[194],"retraining,":[195],"raising":[196],"96.60%":[201],"95.32%":[203],"accuracy":[204,215],"probe.":[209],"These":[210],"results":[211],"show":[212],"standard":[214],"hide":[217],"clinically":[219],"meaningful":[220],"inference-time":[221],"failure.":[223],"Source":[224],"code":[225],"construction":[228],"scripts":[229],"are":[230],"available":[231],"at":[232],"https://github.com/fangzr/cxr-contrabench-code.":[233]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-09T00:00:00"}
