{"id":"https://openalex.org/W7161788075","doi":"https://doi.org/10.1109/isbi61048.2026.11515920","title":"CTest-Metric: A Unified Framework to Assess Clinical Validity of Metrics for CT Report Generation","display_name":"CTest-Metric: A Unified Framework to Assess Clinical Validity of Metrics for CT Report Generation","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7161788075","doi":"https://doi.org/10.1109/isbi61048.2026.11515920"},"language":null,"primary_location":{"id":"doi:10.1109/isbi61048.2026.11515920","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isbi61048.2026.11515920","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE 23rd International Symposium on Biomedical Imaging (ISBI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043592090","display_name":"Vanshali Sharma","orcid":"https://orcid.org/0000-0003-0008-1579"},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]},{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Vanshali Sharma","raw_affiliation_strings":["Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA","institution_ids":["https://openalex.org/I111979921","https://openalex.org/I1343180700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123350622","display_name":"Andrea Mia Bejar","orcid":null},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]},{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrea Mia Bejar","raw_affiliation_strings":["Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA","institution_ids":["https://openalex.org/I111979921","https://openalex.org/I1343180700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033826718","display_name":"G\u00f6rkem Durak","orcid":"https://orcid.org/0000-0002-1608-1955"},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]},{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gorkem Durak","raw_affiliation_strings":["Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA","institution_ids":["https://openalex.org/I111979921","https://openalex.org/I1343180700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5136569863","display_name":"Ulas Bagci","orcid":null},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]},{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ulas Bagci","raw_affiliation_strings":["Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern University,Machine and Hybrid Intelligence Lab,Chicago,IL,USA","institution_ids":["https://openalex.org/I111979921","https://openalex.org/I1343180700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5043592090"],"corresponding_institution_ids":["https://openalex.org/I111979921","https://openalex.org/I1343180700"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.92888159,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11894","display_name":"Radiology practices and education","score":0.4643000066280365,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11894","display_name":"Radiology practices and education","score":0.4643000066280365,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10206","display_name":"Meta-analysis and systematic reviews","score":0.11540000140666962,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.05829999968409538,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.33559998869895935},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.26499998569488525},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.2590999901294708},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.24950000643730164}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4887999892234802},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38659998774528503},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.33559998869895935},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.3231000006198883},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.27959999442100525},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2734000086784363},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.24950000643730164},{"id":"https://openalex.org/C544519230","wikidata":"https://www.wikidata.org/wiki/Q32566","display_name":"Computed tomography","level":2,"score":0.24310000240802765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isbi61048.2026.11515920","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isbi61048.2026.11515920","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE 23rd International Symposium on Biomedical Imaging (ISBI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4895294555","display_name":null,"funder_award_id":"R01-HL171376","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"}],"funders":[{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2101105183","https://openalex.org/W2963466845","https://openalex.org/W4385546024","https://openalex.org/W4388713229","https://openalex.org/W4404622590","https://openalex.org/W4404781831","https://openalex.org/W4404782825","https://openalex.org/W4410295368","https://openalex.org/W4413887286","https://openalex.org/W4414364899"],"related_works":[],"abstract_inverted_index":{"In":[0],"the":[1,43,75,183],"generative":[2],"AI":[3],"era,":[4],"where":[5],"even":[6],"critical":[7],"medical":[8],"tasks":[9],"are":[10,127,147,190],"increasingly":[11],"automated,":[12],"radiology":[13],"report":[14],"generation":[15],"(RRG)":[16],"continues":[17],"to":[18,42,50,150,172],"rely":[19],"on":[20,110,133],"suboptimal":[21],"metrics":[22,28,79,117,146],"for":[23,80],"quality":[24],"assessment.":[25],"Developing":[26],"domain-specific":[27],"has":[29],"therefore":[30],"been":[31],"an":[32],"active":[33],"area":[34],"of":[35,45,78,182],"research,":[36],"yet":[37],"it":[38],"remains":[39],"challenging":[40],"due":[41],"lack":[44],"a":[46,65,134],"unified,":[47],"well-defined":[48],"framework":[49,70],"assess":[51],"their":[52],"robustness":[53],"and":[54,102,167,179],"applicability":[55],"in":[56],"clinical":[57,76],"contexts.":[58],"To":[59],"address":[60],"this,":[61],"we":[62,141],"present":[63],"CTest-Metric,":[64],"first":[66],"unified":[67],"metric":[68],"assessment":[69],"with":[71,157],"three":[72],"modules":[73,84],"determining":[74],"feasibility":[77],"CT":[81,188],"RRG.":[82],"The":[83,176],"test:":[85],"(i)":[86],"Writing":[87],"Style":[88],"Generalizability":[89],"(WSG)":[90],"via":[91],"LLM-based":[92],"rephrasing;":[93],"(ii)":[94],"Synthetic":[95],"Error":[96],"Injection":[97],"(SEI)":[98],"at":[99,192],"graded":[100],"severities;":[101],"(iii)":[103],"Metrics-vs-Expert":[104],"correlation":[105],"(MvE)":[106],"using":[107],"clinician":[108],"ratings":[109],"175":[111],"\u201cdisagreement\u201d":[112],"cases.":[113],"Eight":[114],"widely":[115],"used":[116],"(BLEU,":[118],"ROUGE,":[119],"METEOR,":[120],"BERTScore-F1,":[121],"F1-RadGraph,":[122],"RaTEScore,":[123],"GREEN":[124,153],"Score,":[125],"CRG)":[126],"studied":[128],"across":[129],"seven":[130],"LLMs":[131],"built":[132],"CT-CLIP":[135],"encoder.":[136],"Using":[137],"our":[138],"novel":[139],"framework,":[140,177],"found":[142],"that":[143],"lexical":[144],"NLG":[145],"highly":[148],"sensitive":[149,171],"stylistic":[151],"variations;":[152],"Score":[154],"aligns":[155],"best":[156],"expert":[158],"judgments":[159],"(Spearman":[160],"0.70),":[161],"while":[162],"CRG":[163],"shows":[164],"negative":[165],"correlation;":[166],"BERTScore-F1":[168],"is":[169],"least":[170],"factual":[173],"error":[174],"injection.":[175],"code,":[178],"allowable":[180],"portion":[181],"anonymized":[184],"evaluation":[185],"data":[186],"(rephrased/error-injected":[187],"reports)":[189],"available":[191],"https://github.com/NUBagciLab/CTestMetric.":[193]},"counts_by_year":[],"updated_date":"2026-05-22T06:13:13.366637","created_date":"2026-05-21T00:00:00"}
