{"id":"https://openalex.org/W7117480724","doi":"https://doi.org/10.1109/dicta68720.2025.11302462","title":"Generating Clinically Relevant Reports from Chest X-Rays for Cardiomegaly Diagnosis","display_name":"Generating Clinically Relevant Reports from Chest X-Rays for Cardiomegaly Diagnosis","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7117480724","doi":"https://doi.org/10.1109/dicta68720.2025.11302462"},"language":null,"primary_location":{"id":"doi:10.1109/dicta68720.2025.11302462","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dicta68720.2025.11302462","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Digital Image Computing: Techniques and Applications (DICTA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069545297","display_name":"Chayan Mondal","orcid":"https://orcid.org/0000-0002-3871-1065"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Chayan Mondal","raw_affiliation_strings":["School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121489144","display_name":"Chai Ken Kai","orcid":null},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Chai Ken Kai","raw_affiliation_strings":["School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004852178","display_name":"Duc-Son Pham","orcid":"https://orcid.org/0000-0002-4006-7803"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Duc-Son Pham","raw_affiliation_strings":["School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091801631","display_name":"Tele Tan","orcid":"https://orcid.org/0000-0003-3195-3480"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Tele Tan","raw_affiliation_strings":["School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121446795","display_name":"Tom Gedeon","orcid":null},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Tom Gedeon","raw_affiliation_strings":["School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Computing and Mathematical Sciences, Curtin University,Perth,Western Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121516607","display_name":"Ashu Gupta","orcid":null},"institutions":[{"id":"https://openalex.org/I2800728469","display_name":"Fiona Stanley Hospital","ror":"https://ror.org/027p0bm56","country_code":"AU","type":"healthcare","lineage":["https://openalex.org/I2799506148","https://openalex.org/I2800728469","https://openalex.org/I2800882159","https://openalex.org/I4388446375","https://openalex.org/I4388482742"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ashu Gupta","raw_affiliation_strings":["Fiona Stanley Hospital,Radiology Department, Medical Imaging,Perth,Western Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Fiona Stanley Hospital,Radiology Department, Medical Imaging,Perth,Western Australia","institution_ids":["https://openalex.org/I2800728469"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5069545297"],"corresponding_institution_ids":["https://openalex.org/I205640436"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.62002299,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.22779999673366547,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.22779999673366547,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.19059999287128448,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1446000039577484,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5184999704360962},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5175999999046326},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5139999985694885},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.5044000148773193},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.45489999651908875},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.44679999351501465},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4163999855518341}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6049000024795532},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5846999883651733},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5184999704360962},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5175999999046326},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5139999985694885},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.5044000148773193},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.45489999651908875},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.44679999351501465},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4163999855518341},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4036000072956085},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.373199999332428},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.36809998750686646},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.3343999981880188},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.33390000462532043},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.32850000262260437},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32510000467300415},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3100000023841858},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.2791999876499176},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2775999903678894},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.275299996137619},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.26750001311302185},{"id":"https://openalex.org/C544519230","wikidata":"https://www.wikidata.org/wiki/Q32566","display_name":"Computed tomography","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2533999979496002},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dicta68720.2025.11302462","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dicta68720.2025.11302462","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Digital Image Computing: Techniques and Applications (DICTA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4464883506298065,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W2770165365","https://openalex.org/W2963967185","https://openalex.org/W2995225687","https://openalex.org/W3114128166","https://openalex.org/W3138516171","https://openalex.org/W3151410070","https://openalex.org/W3163537520","https://openalex.org/W4200122203","https://openalex.org/W4321021687","https://openalex.org/W4387698276","https://openalex.org/W4390905318","https://openalex.org/W4391305966","https://openalex.org/W4403109359","https://openalex.org/W4405446156","https://openalex.org/W4407474086","https://openalex.org/W4411026889","https://openalex.org/W4411336987"],"related_works":[],"abstract_inverted_index":{"Despite":[0],"significant":[1],"advancements":[2],"in":[3,185,216],"automatic":[4],"Xray":[5],"report":[6,108,166],"generation,":[7],"clinical":[8,20,218],"adoption":[9],"remains":[10],"limited.":[11],"A":[12],"key":[13],"barrier":[14],"is":[15],"the":[16,61,68,73,77,107,125,135,157,186,209],"lack":[17],"of":[18,72,134,205,211],"structured":[19],"metrics\u2013such":[21],"as":[22],"anatomical":[23,214],"measurements\u2013within":[24],"generated":[25],"reports,":[26],"which":[27,92],"hinders":[28],"their":[29,45],"practical":[30],"utility":[31],"for":[32,188],"diagnosis.":[33],"Current":[34],"languageand":[35],"vision-language-based":[36],"approaches":[37],"typically":[38],"overlook":[39],"these":[40],"quantitative":[41,189],"components":[42],"due":[43],"to":[44,76,94],"inherent":[46],"learning":[47],"constraints.":[48],"In":[49],"this":[50],"work,":[51],"we":[52,116,141,155],"focus":[53],"on":[54,124],"cardiomegaly,":[55],"a":[56,118,143,161],"common":[57],"thoracic":[58,138],"condition":[59],"where":[60],"cardiothoracic":[62],"ratio":[63],"(CTR)\u2013a":[64],"measurement":[65],"derived":[66],"from":[67],"width":[69],"and":[70,137,153,172,201],"height":[71],"heart":[74,136],"relative":[75],"thorax\u2013is":[78],"an":[79],"essential":[80],"diagnostic":[81],"metric.":[82],"Unlike":[83],"large":[84],"language":[85],"models":[86,90],"(LLMs)":[87],"or":[88],"vision-language":[89],"(VLMs),":[91],"struggle":[93],"extract":[95],"such":[96],"precise":[97],"geometric":[98],"features,":[99],"our":[100,191],"approach":[101],"explicitly":[102],"incorporates":[103],"CTR":[104,158,180,197],"estimation":[105],"into":[106,160],"generation":[109,167],"process.":[110],"Our":[111],"contributions":[112],"are":[113,182],"threefold:":[114],"(1)":[115],"introduce":[117],"novel":[119],"cardiomegaly-specific":[120],"annotation":[121],"set":[122],"based":[123],"MIMIC-CXR":[126],"dataset,":[127],"comprising":[128],"300":[129],"manually":[130],"annotated":[131],"bounding":[132],"boxes":[133],"cavity;":[139],"(2)":[140],"develop":[142],"YOLOv11-based":[144],"cardiomegaly":[145],"detector":[146],"that":[147,195],"achieves":[148],"over":[149],"99%":[150],"AP@50":[151],"performance;":[152],"(3)":[154],"integrate":[156],"computation":[159],"Vision":[162],"Encoder":[163],"Decoder":[164],"(VED)-based":[165],"model,":[168],"enabling":[169],"more":[170,199],"refined":[171],"clinically":[173],"aligned":[174],"radiology":[175],"reports.":[176],"Although":[177],"ground":[178],"truth":[179],"values":[181],"not":[183],"available":[184],"dataset":[187],"evaluation,":[190],"qualitative":[192],"results":[193],"demonstrate":[194],"incorporating":[196,212],"enables":[198],"accurate":[200],"interpretable":[202],"severity":[203],"descriptions":[204],"cardiomegaly.":[206],"This":[207],"highlights":[208],"effectiveness":[210],"explicit":[213],"measurements":[215],"enhancing":[217],"usability.":[219]},"counts_by_year":[],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2025-12-29T00:00:00"}
