{"id":"https://openalex.org/W7161744240","doi":"https://doi.org/10.48550/arxiv.2605.17140","title":"UCSF-PDGM-VQA: Visual Question Answering dataset for brain tumor MRI interpretation","display_name":"UCSF-PDGM-VQA: Visual Question Answering dataset for brain tumor MRI interpretation","publication_year":2026,"publication_date":"2026-05-16","ids":{"openalex":"https://openalex.org/W7161744240","doi":"https://doi.org/10.48550/arxiv.2605.17140"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.17140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.17140","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136492021","display_name":"Shiv Ghosh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ghosh, Shiv","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120084472","display_name":"Junayd Lateef","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lateef, Junayd","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136476435","display_name":"Chih-Hua","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Chih-Hua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136472610","display_name":"liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Yannan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136467266","display_name":"Yannan Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rauschecker, Andreas M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5029857320","display_name":"Andreas M. Rauschecker","orcid":"https://orcid.org/0000-0003-0633-9876"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sushil, Madhumita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9210000038146973,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9210000038146973,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.019600000232458115,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.016300000250339508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.5785999894142151},{"id":"https://openalex.org/keywords/interpretation","display_name":"Interpretation (philosophy)","score":0.5454000234603882},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5246999859809875},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5196999907493591},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5174000263214111},{"id":"https://openalex.org/keywords/magnetic-resonance-imaging","display_name":"Magnetic resonance imaging","score":0.5016000270843506},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.44609999656677246},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.42879998683929443}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6272000074386597},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.5785999894142151},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.5454000234603882},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5246999859809875},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5196999907493591},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5174000263214111},{"id":"https://openalex.org/C143409427","wikidata":"https://www.wikidata.org/wiki/Q161238","display_name":"Magnetic resonance imaging","level":2,"score":0.5016000270843506},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.44609999656677246},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4453999996185303},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.42879998683929443},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41190001368522644},{"id":"https://openalex.org/C2779130545","wikidata":"https://www.wikidata.org/wiki/Q233309","display_name":"Brain tumor","level":2,"score":0.38850000500679016},{"id":"https://openalex.org/C58693492","wikidata":"https://www.wikidata.org/wiki/Q551875","display_name":"Neuroimaging","level":2,"score":0.3734000027179718},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.36579999327659607},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3149999976158142},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.29440000653266907},{"id":"https://openalex.org/C2988762625","wikidata":"https://www.wikidata.org/wiki/Q492038","display_name":"Brain anatomy","level":3,"score":0.29330000281333923},{"id":"https://openalex.org/C2779226451","wikidata":"https://www.wikidata.org/wiki/Q903809","display_name":"Functional magnetic resonance imaging","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.28380000591278076},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.17140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.17140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Brain":[0],"tumor":[1],"diagnosis":[2],"is":[3,38,48],"largely":[4],"dependent":[5],"on":[6,140,167],"Magnetic":[7],"Resonance":[8],"Imaging":[9],"(MRI)":[10],"evaluation,":[11],"which":[12],"requires":[13,29],"radiologists":[14],"to":[15,50,63,84],"synthesize":[16],"thousands":[17],"of":[18,72,87,109,150,162,191],"images":[19],"across":[20],"multiple":[21],"3D":[22],"sequences":[23],"and":[24,37,135,165,183],"longitudinal":[25],"studies.":[26],"This":[27],"process":[28],"advanced":[30],"neuro-radiology":[31],"training,":[32],"poses":[33],"substantial":[34],"cognitive":[35],"load,":[36],"highly":[39],"time-consuming.":[40],"Despite":[41],"increasing":[42],"demands":[43],"in":[44,81,118,159,179],"radiology,":[45],"this":[46,65,141],"expertise":[47],"difficult":[49],"scale,":[51],"straining":[52],"the":[53,104,119,189],"current":[54,146,180],"health":[55],"systems.":[56],"Vision-Language":[57],"Models":[58],"(VLMs)":[59,134],"provide":[60],"an":[61],"opportunity":[62],"reduce":[64],"burden":[66],"through":[67],"a":[68,85,95,126,160,176],"semi-automated,":[69],"interactive":[70],"interpretation":[71],"complex":[73],"brain":[74],"MRIs.":[75],"However,":[76],"they":[77],"are":[78,148],"currently":[79],"underutilized":[80],"neuro-oncology":[82],"due":[83],"lack":[86],"specialized":[88],"benchmarks":[89],"for":[90,129],"evaluating":[91],"them.":[92],"We":[93,123,143],"introduce":[94],"clinically":[96],"relevant":[97],"visual":[98,163],"question":[99],"answering":[100],"(VQA)":[101],"benchmark":[102],"--":[103,107],"UCSF-PDGM-VQA":[105],"dataset":[106],"consisting":[108],"2,387":[110],"QA":[111],"pairs":[112],"from":[113],"473":[114],"glioma-related":[115],"MRI":[116,155],"studies":[117],"public":[120],"UCSF-PDGM":[121],"dataset.":[122,142],"further":[124],"establish":[125],"performance":[127],"baseline":[128],"six":[130],"state-of-the-art":[131],"vision-language":[132],"models":[133,147],"one":[136],"large":[137],"language":[138,168],"model":[139,181],"find":[144],"that":[145],"incapable":[149],"effectively":[151],"processing":[152],"multi-sequence,":[153],"3-dimensional":[154],"scans,":[156],"thus":[157],"resulting":[158],"suppression":[161],"features":[164],"over-reliance":[166],"priors,":[169],"causing":[170],"modality":[171],"collapse.":[172],"These":[173],"findings":[174],"underscore":[175],"critical":[177],"deficiency":[178],"reliability":[182],"safety":[184],"within":[185],"clinical":[186],"settings,":[187],"necessitating":[188],"development":[190],"robust,":[192],"domain-specific":[193],"VLMs.":[194]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
