{"id":"https://openalex.org/W7138298043","doi":"https://doi.org/10.1609/aaai.v40i15.38302","title":"GEMA-Score: Granular Explainable Multi-Agent Scoring Framework for Radiology Report Evaluation","display_name":"GEMA-Score: Granular Explainable Multi-Agent Scoring Framework for Radiology Report Evaluation","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138298043","doi":"https://doi.org/10.1609/aaai.v40i15.38302"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i15.38302","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i15.38302","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i15.38302","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114973376","display_name":"Zhenxuan Zhang","orcid":"https://orcid.org/0009-0002-2904-2848"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Zhenxuan Zhang","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026770176","display_name":"Kinhei Lee","orcid":"https://orcid.org/0009-0000-6832-9863"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"KinHei Lee","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065454976","display_name":"Peiyuan Jing","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Peiyuan Jing","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125719277","display_name":"Weihang Deng","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Weihang Deng","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129656094","display_name":"Huichi Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Huichi Zhou","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129689730","display_name":"Zihao Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zihao Jin","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129664969","display_name":"Jiahao Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jiahao Huang","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049053722","display_name":"Zhifan Gao","orcid":"https://orcid.org/0000-0002-1576-4439"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhifan Gao","raw_affiliation_strings":["School of Biomedical Engineering, Sun Yat-sen University, China"],"affiliations":[{"raw_affiliation_string":"School of Biomedical Engineering, Sun Yat-sen University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129713219","display_name":"Dominic C. Marshall","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Dominic C. Marshall","raw_affiliation_strings":["Department of Surgery & Cancer, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Surgery & Cancer, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129599417","display_name":"Yingying Fang","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yingying Fang","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129672267","display_name":"Guang Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Guang Yang","raw_affiliation_strings":["Department of Bioengineering, Imperial College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Bioengineering, Imperial College London, UK","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5114973376"],"corresponding_institution_ids":["https://openalex.org/I47508984"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.50910064,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"15","first_page":"13025","last_page":"13033"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2540999948978424,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2540999948978424,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.1517000049352646,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.14569999277591705,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/terminology","display_name":"Terminology","score":0.6972000002861023},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.6110000014305115},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5396999716758728},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.47200000286102295}],"concepts":[{"id":"https://openalex.org/C547195049","wikidata":"https://www.wikidata.org/wiki/Q1725664","display_name":"Terminology","level":2,"score":0.6972000002861023},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.6110000014305115},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.546999990940094},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5396999716758728},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.47200000286102295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41850000619888306},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.4099999964237213},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3962000012397766},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3061000108718872},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.29409998655319214},{"id":"https://openalex.org/C3018395757","wikidata":"https://www.wikidata.org/wiki/Q1379672","display_name":"Evaluation methods","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.25760000944137573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i15.38302","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i15.38302","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i15.38302","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i15.38302","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6331790685653687,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Automatic":[0],"medical":[1],"report":[2],"generation":[3],"has":[4],"the":[5,12,31,152],"potential":[6,18],"to":[7,29,65,123],"support":[8],"clinical":[9,32,68,78,140,171],"diagnosis,":[10,126],"reduce":[11],"workload":[13],"of":[14,34,119],"radiologists,":[15],"and":[16,97,112,129,139],"demonstrate":[17],"for":[19],"enhancing":[20],"diagnostic":[21,45,53],"consistency.":[22],"However,":[23],"current":[24],"evaluation":[25,99],"metrics":[26,46,54,71],"often":[27],"fail":[28],"reflect":[30],"reliability":[33],"generated":[35],"reports.":[36],"Overlap-based":[37],"methods":[38],"overlook":[39],"fine-grained":[40],"details":[41],"(e.g.,":[42],"location,":[43,127],"severity),":[44],"are":[47,55],"constrained":[48],"by":[49,57],"fixed":[50,58],"vocabularies.":[51],"Some":[52],"limited":[56],"vocabularies":[59],"or":[60],"templates,":[61],"reducing":[62],"their":[63],"ability":[64],"capture":[66],"diverse":[67],"expressions.":[69],"LLM-based":[70,133],"lack":[72],"interpretable":[73],"reasoning,":[74],"limiting":[75],"trust":[76],"in":[77,89],"settings.":[79],"Therefore,":[80],"we":[81],"propose":[82],"a":[83,101],"Granular":[84],"Explainable":[85],"Multi-Agent":[86],"Score":[87],"(GEMA-Score)":[88],"this":[90],"paper,":[91],"which":[92],"conducts":[93],"both":[94],"objective":[95],"quantification":[96],"subjective":[98],"through":[100,116],"large":[102],"language":[103],"model-based":[104],"multi-agent":[105],"workflow.":[106],"Our":[107],"GEMA-Score":[108,150],"parses":[109],"structured":[110],"reports":[111],"employs":[113],"stable":[114],"calculations":[115],"interactive":[117],"exchanges":[118],"information":[120],"among":[121],"agents":[122],"assess":[124],"disease":[125],"severity,":[128],"uncertainty.":[130],"Additionally,":[131],"an":[132],"scoring":[134,172],"agent":[135],"evaluates":[136],"completeness,":[137],"readability,":[138],"terminology":[141],"while":[142],"providing":[143],"explanatory":[144],"feedback.":[145],"Extensive":[146],"experiments":[147],"show":[148],"that":[149],"achieves":[151],"highest":[153],"correlation":[154],"with":[155],"human":[156],"experts":[157],"on":[158,164,167],"public":[159],"datasets":[160],"(Kendall":[161],"=":[162],"0.69":[163],"ReXVal;":[165],"0.45":[166],"RadEvalX),":[168],"demonstrating":[169],"improved":[170],"reliability.":[173]},"counts_by_year":[],"updated_date":"2026-03-20T20:47:17.329874","created_date":"2026-03-18T00:00:00"}
