{"id":"https://openalex.org/W7126019331","doi":"https://doi.org/10.1109/bibm66473.2025.11356296","title":"Advancing Reliable Medical VQA: Evaluation and Enhancement of Model Robustness","display_name":"Advancing Reliable Medical VQA: Evaluation and Enhancement of Model Robustness","publication_year":2025,"publication_date":"2025-12-15","ids":{"openalex":"https://openalex.org/W7126019331","doi":"https://doi.org/10.1109/bibm66473.2025.11356296"},"language":null,"primary_location":{"id":"doi:10.1109/bibm66473.2025.11356296","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070538578","display_name":"Shuning He","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuning He","raw_affiliation_strings":["Harbin Engineering University,Department of Computer Science and Technology,Harbin,China"],"affiliations":[{"raw_affiliation_string":"Harbin Engineering University,Department of Computer Science and Technology,Harbin,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124289130","display_name":"Da Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Da Ren","raw_affiliation_strings":["The Hong Kong Polytechnic University,Department of Computing,Hong Kong,China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University,Department of Computing,Hong Kong,China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124282722","display_name":"Haiwei Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haiwei Pan","raw_affiliation_strings":["Harbin Engineering University,Department of Computer Science and Technology,Harbin,China"],"affiliations":[{"raw_affiliation_string":"Harbin Engineering University,Department of Computer Science and Technology,Harbin,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124230893","display_name":"Kejia Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kejia Zhang","raw_affiliation_strings":["Harbin Engineering University,Department of Computer Science and Technology,Harbin,China"],"affiliations":[{"raw_affiliation_string":"Harbin Engineering University,Department of Computer Science and Technology,Harbin,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124177002","display_name":"Qing Li","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Qing Li","raw_affiliation_strings":["The Hong Kong Polytechnic University,Department of Computing,Hong Kong,China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University,Department of Computing,Hong Kong,China","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5070538578"],"corresponding_institution_ids":["https://openalex.org/I151727225"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.68968424,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5637","last_page":"5642"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9641000032424927,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9641000032424927,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.009499999694526196,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.004800000227987766,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8044999837875366},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6243000030517578},{"id":"https://openalex.org/keywords/medical-research","display_name":"Medical research","score":0.41029998660087585},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.3930000066757202},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.35339999198913574},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.33570000529289246}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8044999837875366},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6976000070571899},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6243000030517578},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5034000277519226},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48809999227523804},{"id":"https://openalex.org/C106977388","wikidata":"https://www.wikidata.org/wiki/Q2752427","display_name":"Medical research","level":2,"score":0.41029998660087585},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.3930000066757202},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3580000102519989},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.35339999198913574},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.33570000529289246},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.323199987411499},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3127000033855438},{"id":"https://openalex.org/C2982822547","wikidata":"https://www.wikidata.org/wiki/Q179661","display_name":"Medical treatment","level":2,"score":0.30469998717308044},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.2897000014781952},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C2988170871","wikidata":"https://www.wikidata.org/wiki/Q11000047","display_name":"Healthcare system","level":3,"score":0.2578999996185303},{"id":"https://openalex.org/C503897019","wikidata":"https://www.wikidata.org/wiki/Q195818","display_name":"Medical simulation","level":2,"score":0.25200000405311584},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm66473.2025.11356296","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4889963131","display_name":null,"funder_award_id":"62072135","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1588748369","https://openalex.org/W1988883951","https://openalex.org/W2023910643","https://openalex.org/W2025759276","https://openalex.org/W2059784307","https://openalex.org/W2098092211","https://openalex.org/W2120015570","https://openalex.org/W2137236456","https://openalex.org/W2790477006","https://openalex.org/W2794856002","https://openalex.org/W2901466771","https://openalex.org/W2979525559","https://openalex.org/W3165058054","https://openalex.org/W4243260771","https://openalex.org/W4250894278","https://openalex.org/W4283258232","https://openalex.org/W4386566421","https://openalex.org/W4390992001"],"related_works":[],"abstract_inverted_index":{"Medical":[0],"artificial":[1],"intelligence":[2],"(AI)":[3],"plays":[4],"a":[5,28,126,133,165,185,221],"central":[6],"role":[7],"in":[8,89,102,109,224],"advancing":[9],"the":[10,50,66,115,176,232],"rapid":[11],"development":[12],"of":[13,69,96,117,179,201],"AI-driven":[14],"healthcare":[15],"technologies.":[16],"Among":[17],"these":[18,105],"applications,":[19],"medical":[20,39,70,74,130,143,180,190,203,225],"visual":[21,191],"question":[22,192],"answering":[23,193],"(VQA)":[24],"has":[25],"emerged":[26],"as":[27],"critical":[29],"component,":[30],"garnering":[31],"significant":[32,222],"research":[33],"attention.":[34],"However,":[35],"current":[36,229],"approaches":[37],"to":[38,54,81,93,114,137,171,196],"VQA":[40,71,131,204],"predominantly":[41],"prioritize":[42],"achieving":[43],"high":[44],"accuracy":[45],"on":[46,206],"constrained":[47],"datasets,":[48],"overlooking":[49],"multifaceted":[51],"challenges":[52,106],"inherent":[53],"real-world":[55,103,157],"clinical":[56,97],"deployment.":[57,237],"In":[58],"practical":[59,236],"settings,":[60],"two":[61],"key":[62],"factors":[63],"significantly":[64],"influence":[65],"input":[67],"reliability":[68],"systems.":[72],"First,":[73],"imaging":[75,144],"processes":[76],"inherently":[77],"introduce":[78],"noise":[79,158,215],"due":[80,113],"technical":[82],"and":[83,145,159,188,216],"environmental":[84],"variability.":[85,161,217],"Second,":[86],"linguistic":[87,146],"diversity":[88],"patient-provider":[90],"interactions":[91],"leads":[92],"heterogeneous":[94],"phrasing":[95],"questions.":[98],"Despite":[99],"their":[100,209],"inevitability":[101],"scenarios,":[104],"remain":[107],"understudied":[108],"existing":[110,151,202],"research,":[111,227],"largely":[112],"absence":[116],"dedicated":[118],"benchmarks.":[119],"To":[120],"address":[121],"this":[122],"gap,":[123],"we":[124],"propose":[125],"benchmark":[127,135,149],"for":[128,235],"robust":[129],"(RoM-VQA),":[132],"novel":[134],"designed":[136,195],"evaluate":[138,197],"model":[139,198],"robustness":[140,233],"from":[141],"both":[142],"perspectives.":[147],"This":[148],"extends":[150],"datasets":[152],"through":[153],"systematic":[154],"enhancements,":[155],"simulating":[156],"language":[160],"During":[162],"its":[163],"development,":[164],"multiLLM":[166],"collaborative":[167],"framework":[168],"is":[169],"implemented":[170],"minimize":[172],"human":[173],"intervention.":[174],"With":[175],"active":[177],"involvement":[178],"experts,":[181],"our":[182],"paper":[183],"constructs":[184],"diverse,":[186],"high-quality,":[187],"large-scale":[189],"dataset":[194],"robustness.":[199],"Evaluation":[200],"models":[205,230],"RoM-VQA":[207],"demonstrates":[208],"instability":[210],"when":[211],"confronted":[212],"with":[213],"diverse":[214],"These":[218],"results":[219],"highlight":[220],"gap":[223],"AI":[226],"where":[228],"lack":[231],"necessary":[234]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-30T00:00:00"}
