{"id":"https://openalex.org/W4415879973","doi":"https://doi.org/10.48550/arxiv.2510.15418","title":"Fine-Tuning MedGemma for Clinical Captioning to Enhance Multimodal RAG over Malaysia CPGs","display_name":"Fine-Tuning MedGemma for Clinical Captioning to Enhance Multimodal RAG over Malaysia CPGs","publication_year":2025,"publication_date":"2025-10-17","ids":{"openalex":"https://openalex.org/W4415879973","doi":"https://doi.org/10.48550/arxiv.2510.15418"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2510.15418","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.15418","pdf_url":"https://arxiv.org/pdf/2510.15418","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.15418","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120250595","display_name":"Lee Qi Zun","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zun, Lee Qi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120250596","display_name":"Mohamad Zulhilmi Bin Abdul Halim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Halim, Mohamad Zulhilmi Bin Abdul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5120250597","display_name":"Goh Man Fye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fye, Goh Man","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5120250595"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9569000005722046,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9569000005722046,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.009100000374019146,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.0026000000070780516,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8489000201225281},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6851000189781189},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.31610000133514404},{"id":"https://openalex.org/keywords/clinical-practice","display_name":"Clinical Practice","score":0.31189998984336853}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8489000201225281},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.696399986743927},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6851000189781189},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5098000168800354},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5062999725341797},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32019999623298645},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.31610000133514404},{"id":"https://openalex.org/C2779974597","wikidata":"https://www.wikidata.org/wiki/Q28448986","display_name":"Clinical Practice","level":2,"score":0.31189998984336853},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.27140000462532043},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.24169999361038208}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2510.15418","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.15418","pdf_url":"https://arxiv.org/pdf/2510.15418","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2510.15418","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.15418","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.15418","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.15418","pdf_url":"https://arxiv.org/pdf/2510.15418","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Retrieval-Augmented":[0],"Generation":[1],"systems":[2,168],"are":[3],"essential":[4],"for":[5,46,147,164],"providing":[6],"fact-based":[7],"guidance":[8],"from":[9],"Malaysian":[10],"Clinical":[11],"Practice":[12],"Guidelines.":[13],"However,":[14],"their":[15],"effectiveness":[16],"with":[17],"image-based":[18],"queries":[19],"is":[20],"limited,":[21],"as":[22,52,156],"general":[23],"Vision-Language":[24],"Model":[25],"captions":[26,49],"often":[27],"lack":[28],"clinical":[29,171],"specificity":[30],"and":[31,37,73,77,109,129,151],"factual":[32],"grounding.":[33],"This":[34,141],"study":[35],"proposes":[36],"validates":[38,152],"a":[39,61,67,90,99,144,157],"framework":[40,92],"to":[41,65,135],"specialize":[42],"the":[43,81,103,132,153,162],"MedGemma":[44,79],"model":[45,113,155],"generating":[47],"high-fidelity":[48],"that":[50],"serve":[51],"superior":[53],"queries.":[54],"To":[55],"overcome":[56],"data":[57],"scarcity,":[58],"we":[59],"employ":[60],"knowledge":[62],"distillation":[63],"pipeline":[64,146],"create":[66],"synthetic":[68],"dataset":[69],"across":[70],"dermatology,":[71],"fundus,":[72],"chest":[74],"radiography":[75],"domains,":[76],"fine-tune":[78],"using":[80],"parameter-efficient":[82],"QLoRA":[83],"method.":[84],"Performance":[85],"was":[86],"rigorously":[87],"assessed":[88],"through":[89],"dual":[91],"measuring":[93],"both":[94],"classification":[95,118],"accuracy":[96],"and,":[97],"via":[98],"novel":[100],"application":[101],"of":[102],"RAGAS":[104,121],"framework,":[105],"caption":[106,127],"faithfulness,":[107],"relevancy,":[108],"correctness.":[110],"The":[111],"fine-tuned":[112],"demonstrated":[114],"substantial":[115],"improvements":[116],"in":[117,126,169],"performance,":[119],"while":[120],"evaluation":[122],"confirmed":[123],"significant":[124],"gains":[125],"faithfulness":[128],"correctness,":[130],"validating":[131],"models":[133],"ability":[134],"produce":[136],"reliable,":[137],"factually":[138],"grounded":[139],"descriptions.":[140],"work":[142],"establishes":[143],"robust":[145],"specializing":[148],"medical":[149],"VLMs":[150],"resulting":[154],"high-quality":[158],"query":[159],"generator,":[160],"laying":[161],"groundwork":[163],"enhancing":[165],"multimodal":[166],"RAG":[167],"evidence-based":[170],"decision":[172],"support.":[173]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-21T00:00:00"}
