{"id":"https://openalex.org/W7127995352","doi":"https://doi.org/10.48550/arxiv.2602.05692","title":"MedErrBench: A Fine-Grained Multilingual Benchmark for Medical Error Detection and Correction with Clinical Expert Annotations","display_name":"MedErrBench: A Fine-Grained Multilingual Benchmark for Medical Error Detection and Correction with Clinical Expert Annotations","publication_year":2026,"publication_date":"2026-02-05","ids":{"openalex":"https://openalex.org/W7127995352","doi":"https://doi.org/10.48550/arxiv.2602.05692"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.05692","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023786339","display_name":"Congbo Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ma, Congbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125203970","display_name":"Yichun Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yichun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120054811","display_name":"Yousef Al-Jazzazi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Al-Jazzazi, Yousef","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125069724","display_name":"Ahamed Foisal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Foisal, Ahamed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125163099","display_name":"Laasya Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Laasya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125143205","display_name":"Yousra Sadqi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sadqi, Yousra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112894406","display_name":"Khaled Ahmed Saleh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saleh, Khaled","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124877098","display_name":"Jihad Mallat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mallat, Jihad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5023660328","display_name":"Farah E. Shamout","orcid":"https://orcid.org/0000-0002-6076-725X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shamout, Farah E.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5023786339"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.4702000021934509,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.4702000021934509,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.218299999833107,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.19609999656677246,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6525999903678894},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.49810001254081726},{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.4537000060081482},{"id":"https://openalex.org/keywords/error-detection-and-correction","display_name":"Error detection and correction","score":0.4194999933242798},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.3686999976634979},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.3626999855041504},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.35589998960494995}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7925999760627747},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6525999903678894},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5720999836921692},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5236999988555908},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.49810001254081726},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.4537000060081482},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4259999990463257},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.4194999933242798},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.3686999976634979},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.3626999855041504},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35830000042915344},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.35589998960494995},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3343000113964081},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.32989999651908875},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2888999879360199},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2833999991416931},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.28040000796318054},{"id":"https://openalex.org/C2779473830","wikidata":"https://www.wikidata.org/wiki/Q1540899","display_name":"MEDLINE","level":2,"score":0.26969999074935913},{"id":"https://openalex.org/C69505689","wikidata":"https://www.wikidata.org/wiki/Q455338","display_name":"Unified Medical Language System","level":2,"score":0.26100000739097595}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.05692","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.05692","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.05692","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.05692","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7512990236282349,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Inaccuracies":[0],"in":[1,127,166],"existing":[2],"or":[3,19],"generated":[4],"clinical":[5,94,151],"text":[6],"may":[7],"lead":[8],"to":[9,148,153],"serious":[10],"adverse":[11],"consequences,":[12],"especially":[13,47],"if":[14],"it":[15],"is":[16,40,164,176],"a":[17,107],"misdiagnosis":[18],"incorrect":[20],"treatment":[21],"suggestion.":[22],"With":[23],"Large":[24],"Language":[25],"Models":[26],"(LLMs)":[27],"increasingly":[28],"being":[29],"used":[30],"across":[31,48,116],"diverse":[32,49],"healthcare":[33,160],"applications,":[34],"comprehensive":[35],"evaluation":[36,143],"through":[37],"dedicated":[38],"benchmarks":[39],"crucial.":[41],"However,":[42],"such":[43],"datasets":[44],"remain":[45],"scarce,":[46],"languages":[50],"and":[51,67,90,97,112,141,156],"contexts.":[52],"In":[53],"this":[54],"paper,":[55],"we":[56,146],"introduce":[57],"MedErrBench,":[58],"the":[59,71,104,131,167,174],"first":[60],"multilingual":[61,150],"benchmark":[62],"for":[63,133],"error":[64,84],"detection,":[65],"localization,":[66],"correction,":[68],"developed":[69],"under":[70],"guidance":[72],"of":[73,81,106,109,173],"experienced":[74],"clinicians.":[75],"Based":[76],"on":[77],"an":[78],"expanded":[79],"taxonomy":[80],"ten":[82],"common":[83],"types,":[85],"MedErrBench":[86,140],"covers":[87],"English,":[88],"Arabic":[89],"Chinese,":[91],"with":[92],"natural":[93],"cases":[95],"annotated":[96],"reviewed":[98],"by":[99],"domain":[100],"experts.":[101],"We":[102],"assessed":[103],"performance":[105,124],"range":[108],"general-purpose,":[110],"language-specific,":[111],"medical-domain":[113],"language":[114],"models":[115],"all":[117],"three":[118],"tasks.":[119],"Our":[120],"results":[121],"reveal":[122],"notable":[123],"gaps,":[125],"particularly":[126],"non-English":[128],"settings,":[129],"highlighting":[130],"need":[132],"clinically":[134],"grounded,":[135],"language-aware":[136],"systems.":[137],"By":[138],"making":[139],"our":[142],"protocols":[144],"publicly-available,":[145],"aim":[147],"advance":[149],"NLP":[152],"promote":[154],"safer":[155],"more":[157],"equitable":[158],"AI-based":[159],"globally.":[161],"The":[162],"dataset":[163,175],"available":[165,177],"supplementary":[168],"material.":[169],"An":[170],"anonymized":[171],"version":[172],"at:":[178],"https://github.com/congboma/MedErrBench.":[179]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-07T00:00:00"}
