{"id":"https://openalex.org/W7134810499","doi":"https://doi.org/10.48550/arxiv.2603.07769","title":"MedQ-Deg: A Multidimensional Benchmark for Evaluating MLLMs Across Medical Image Quality Degradations","display_name":"MedQ-Deg: A Multidimensional Benchmark for Evaluating MLLMs Across Medical Image Quality Degradations","publication_year":2026,"publication_date":"2026-03-08","ids":{"openalex":"https://openalex.org/W7134810499","doi":"https://doi.org/10.48550/arxiv.2603.07769"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.07769","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128675610","display_name":"Jiyao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Liu, Jiyao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101263879","display_name":"Junzhi Ning","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ning, Junzhi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128638826","display_name":"Chenglong Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Chenglong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078398555","display_name":"Wanying Qu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qu, Wanying","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090122335","display_name":"Jianghan Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Jianghan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128641440","display_name":"Siqi Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Siqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100586103","display_name":"Jinjie Wei","orcid":"https://orcid.org/0009-0003-5570-0880"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Jinjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128639324","display_name":"Jin Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Jin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128651903","display_name":"Pengze Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Pengze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128655997","display_name":"Tianbin Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Tianbin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100568833","display_name":"Jiashi Lin","orcid":"https://orcid.org/0000-0002-2696-6204"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Jiashi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049086157","display_name":"Hongming Shan","orcid":"https://orcid.org/0000-0002-0604-3197"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shan, Hongming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121124146","display_name":"Xinzhe Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Xinzhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128682219","display_name":"Xiaohong Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaohong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085516582","display_name":"Lihao Liu","orcid":"https://orcid.org/0000-0002-8983-2342"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Lihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128650376","display_name":"Junjun He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Junjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128689564","display_name":"Ningsheng Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Ningsheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":17,"corresponding_author_ids":["https://openalex.org/A5128675610"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.28760001063346863,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.28760001063346863,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11894","display_name":"Radiology practices and education","score":0.12380000203847885,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.09139999747276306,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7599999904632568},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.6327000260353088},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.5861999988555908},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5231000185012817},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.5059999823570251},{"id":"https://openalex.org/keywords/image-quality","display_name":"Image quality","score":0.48969998955726624},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.460099995136261},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.4429999887943268}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7599999904632568},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7240999937057495},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.6327000260353088},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.5861999988555908},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5526999831199646},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5444999933242798},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5231000185012817},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.5059999823570251},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.48969998955726624},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4740000069141388},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.460099995136261},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.4429999887943268},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.4361000061035156},{"id":"https://openalex.org/C44249647","wikidata":"https://www.wikidata.org/wiki/Q208498","display_name":"Confidence interval","level":2,"score":0.39500001072883606},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3720000088214874},{"id":"https://openalex.org/C2779679103","wikidata":"https://www.wikidata.org/wiki/Q5251805","display_name":"Degradation (telecommunications)","level":2,"score":0.3653999865055084},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3197000026702881},{"id":"https://openalex.org/C2983241795","wikidata":"https://www.wikidata.org/wiki/Q6806500","display_name":"Medical decision making","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C2779346075","wikidata":"https://www.wikidata.org/wiki/Q7268763","display_name":"Quality Score","level":3,"score":0.29429998993873596},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2565999925136566}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.07769","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.07769","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.07769","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.07769","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"impressive":[1],"performance":[2,118,139],"on":[3],"standard":[4],"benchmarks,":[5],"multimodal":[6],"large":[7],"language":[8],"models":[9,147,164],"(MLLMs)":[10],"face":[11],"critical":[12,134],"challenges":[13],"in":[14,191],"real-world":[15],"clinical":[16,193],"environments":[17],"where":[18],"medical":[19,39,62,184],"images":[20],"inevitably":[21],"suffer":[22],"various":[23],"quality":[24,41,66],"degradations.":[25,67],"Existing":[26],"benchmarks":[27],"exhibit":[28,149],"two":[29],"key":[30],"limitations:":[31],"(1)":[32,136],"absence":[33],"of":[34,128],"large-scale,":[35],"multidimensional":[36],"assessment":[37],"across":[38,170],"image":[40,65],"gradients":[42],"and":[43,81,116,162,175,189],"(2)":[44,146],"no":[45],"systematic":[46],"confidence":[47,115,157],"calibration":[48],"analysis.":[49],"To":[50],"address":[51],"these":[52],"gaps,":[53],"we":[54],"present":[55],"MedQ-Deg,":[56],"a":[57,112],"comprehensive":[58,126],"benchmark":[59],"for":[60],"evaluating":[61],"MLLMs":[63,131,185],"under":[64,123],"MedQ-Deg":[68,180],"provides":[69],"multi-dimensional":[70],"evaluation":[71,127],"spanning":[72],"18":[73],"distinct":[74],"degradation":[75,90,143,176],"types,":[76],"30":[77],"fine-grained":[78],"capability":[79,171],"dimensions,":[80,172],"7":[82],"imaging":[83,173],"modalities,":[84,174],"with":[85],"24,894":[86],"question-answer":[87],"pairs.":[88],"Each":[89],"is":[91],"implemented":[92],"at":[93],"3":[94],"severity":[95,144],"degrees,":[96],"calibrated":[97],"by":[98],"expert":[99],"radiologists.":[100],"We":[101,178],"further":[102],"introduce":[103],"Calibration":[104],"Shift":[105],"metric,":[106],"which":[107],"quantifies":[108],"the":[109,150],"gap":[110],"between":[111],"model's":[113],"perceived":[114],"actual":[117],"to":[119],"assess":[120],"metacognitive":[121],"reliability":[122],"degradation.":[124],"Our":[125],"40":[129],"mainstream":[130],"reveals":[132],"several":[133],"findings:":[135],"overall":[137],"model":[138],"degrades":[140],"systematically":[141],"as":[142],"increases,":[145],"universally":[148],"AI":[151],"Dunning-Kruger":[152],"Effect,":[153],"maintaining":[154],"inappropriately":[155],"high":[156],"despite":[158],"severe":[159],"accuracy":[160],"collapse,":[161],"(3)":[163],"display":[165],"markedly":[166],"differentiated":[167],"behavioral":[168],"patterns":[169],"types.":[177],"hope":[179],"drives":[181],"progress":[182],"toward":[183],"that":[186],"are":[187],"robust":[188],"trustworthy":[190],"real":[192],"practice.":[194]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-11T00:00:00"}
