{"id":"https://openalex.org/W7126031496","doi":"https://doi.org/10.1109/bibm66473.2025.11356359","title":"Med-SER: Enhancing Reasoning Interpretability in Medical Visual Question Answering via Structured Chain-of-Thought","display_name":"Med-SER: Enhancing Reasoning Interpretability in Medical Visual Question Answering via Structured Chain-of-Thought","publication_year":2025,"publication_date":"2025-12-15","ids":{"openalex":"https://openalex.org/W7126031496","doi":"https://doi.org/10.1109/bibm66473.2025.11356359"},"language":null,"primary_location":{"id":"doi:10.1109/bibm66473.2025.11356359","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356359","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079546611","display_name":"Jinhao Qiao","orcid":"https://orcid.org/0009-0002-8434-1445"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jinhao Qiao","raw_affiliation_strings":["Hunan University,Changsha,China"],"affiliations":[{"raw_affiliation_string":"Hunan University,Changsha,China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100610996","display_name":"Sihan Li","orcid":"https://orcid.org/0000-0003-2496-7147"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]},{"id":"https://openalex.org/I4210089761","display_name":"West China Hospital of Sichuan University","ror":"https://ror.org/007mrxy13","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210089761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sihan Li","raw_affiliation_strings":["West China Hospital of Sichuan University,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"West China Hospital of Sichuan University,Chengdu,China","institution_ids":["https://openalex.org/I24185976","https://openalex.org/I4210089761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085263960","display_name":"J. Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210137977","display_name":"Advanced Micro Devices (United States)","ror":"https://ror.org/04kd6c783","country_code":"US","type":"company","lineage":["https://openalex.org/I4210137977"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiang Liu","raw_affiliation_strings":["Advanced Micro Devices,California,USA"],"affiliations":[{"raw_affiliation_string":"Advanced Micro Devices,California,USA","institution_ids":["https://openalex.org/I4210137977"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101867679","display_name":"Heng Yu","orcid":"https://orcid.org/0000-0003-4391-7233"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Heng Yu","raw_affiliation_strings":["Hunan University,Changsha,China","Stanford University,California,USA"],"affiliations":[{"raw_affiliation_string":"Hunan University,Changsha,China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"Stanford University,California,USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108974443","display_name":"Y. L. Xiao","orcid":"https://orcid.org/0009-0005-7890-5306"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Xiao","raw_affiliation_strings":["Hunan University,Changsha,China"],"affiliations":[{"raw_affiliation_string":"Hunan University,Changsha,China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033804543","display_name":"D. L. Yao","orcid":null},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Hongshan Yu","raw_affiliation_strings":["Hunan University,Changsha,China","Stanford University,California,USA"],"affiliations":[{"raw_affiliation_string":"Hunan University,Changsha,China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"Stanford University,California,USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5120850132","display_name":"Yupeng Zheng","orcid":"https://orcid.org/0000-0003-4720-7378"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Zheng","raw_affiliation_strings":["Hunan University,Changsha,China"],"affiliations":[{"raw_affiliation_string":"Hunan University,Changsha,China","institution_ids":["https://openalex.org/I16609230"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5079546611"],"corresponding_institution_ids":["https://openalex.org/I16609230"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.72235019,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4036","last_page":"4040"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0013000000035390258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.00039999998989515007,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9562000036239624},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.7332000136375427},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.602400004863739},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5322999954223633},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5153999924659729},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.48350000381469727},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4147999882698059}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9562000036239624},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.734000027179718},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.7332000136375427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6929000020027161},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.602400004863739},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5322999954223633},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5153999924659729},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.48350000381469727},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4259999990463257},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4147999882698059},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3772999942302704},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.3578000068664551},{"id":"https://openalex.org/C97364631","wikidata":"https://www.wikidata.org/wiki/Q484284","display_name":"Deductive reasoning","level":2,"score":0.2782000005245209},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.2775000035762787},{"id":"https://openalex.org/C134752490","wikidata":"https://www.wikidata.org/wiki/Q374182","display_name":"Logical consequence","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.2685999870300293},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25760000944137573},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm66473.2025.11356359","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356359","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2901466771","https://openalex.org/W2911489562","https://openalex.org/W2965373594","https://openalex.org/W3046375318","https://openalex.org/W3091737531","https://openalex.org/W4379879090","https://openalex.org/W4386566421","https://openalex.org/W4386882992","https://openalex.org/W4399353257","https://openalex.org/W4404782528","https://openalex.org/W4406160879","https://openalex.org/W4410953625"],"related_works":[],"abstract_inverted_index":{"Existing":[0],"Medical":[1],"Visual":[2,75],"Question":[3],"Answering":[4],"(Med-VQA)":[5],"methods":[6],"typically":[7],"rely":[8],"on":[9,103],"either":[10],"direct":[11],"answer":[12],"generation":[13],"or":[14,25],"Chain-of-Thought":[15,40],"(CoT)":[16],"reasoning,":[17],"both":[18,81],"of":[19,111],"which":[20,42],"suffer":[21],"from":[22],"limited":[23],"interpretability":[24],"logical":[26,99],"inconsistency.":[27],"To":[28,55],"overcome":[29],"these":[30],"challenges,":[31],"we":[32,58],"propose":[33],"Med-SER,":[34],"a":[35,73,88,115],"novel":[36],"framework":[37],"featuring":[38],"Structured":[39],"(SCoT),":[41],"decomposes":[43],"reasoning":[44,68],"into":[45],"four":[46],"clinically":[47],"grounded":[48],"stages:":[49],"Summary,":[50],"Caption,":[51],"Reasoning,":[52],"and":[53,83,87,98,118],"Conclusion.":[54],"facilitate":[56],"training,":[57],"construct":[59],"VQA-RAD-SCoT,":[60],"the":[61,109],"first":[62],"Med-VQA":[63],"dataset":[64],"annotated":[65],"with":[66],"structured":[67],"chains.":[69],"Med-SER":[70,107,112],"further":[71],"introduces":[72],"Dual-Channel":[74],"Projection":[76],"(DCVP)":[77],"module":[78],"to":[79,113],"extract":[80],"holistic":[82],"stage-specific":[84],"visual":[85],"features,":[86],"Dual":[89],"Dynamic":[90],"Supervision":[91],"(DDS)":[92],"mechanism":[93],"combining":[94],"adaptive":[95],"stage-aware":[96],"weighting":[97],"consistency":[100],"loss.":[101],"Experiments":[102],"VQA-RAD-SCoT":[104],"demonstrate":[105],"that":[106],"demonstrates":[108],"potential":[110],"establish":[114],"new":[116],"interpretable":[117],"trustworthy":[119],"paradigm":[120],"for":[121],"Med-VQA.":[122]},"counts_by_year":[],"updated_date":"2026-02-01T03:34:12.195049","created_date":"2026-01-30T00:00:00"}
