{"id":"https://openalex.org/W7160554160","doi":"https://doi.org/10.48550/arxiv.2605.04180","title":"MedFabric and EtHER: A Data-Centric Framework for Word-Level Fabrication Generation and Detection in Medical LLMs","display_name":"MedFabric and EtHER: A Data-Centric Framework for Word-Level Fabrication Generation and Detection in Medical LLMs","publication_year":2026,"publication_date":"2026-05-05","ids":{"openalex":"https://openalex.org/W7160554160","doi":"https://doi.org/10.48550/arxiv.2605.04180"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.04180","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04180","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.04180","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135594337","display_name":"Tung Sum Thomas Kwok","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwok, Tung Sum Thomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135629462","display_name":"Qian Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Qian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135586659","display_name":"Xiaofeng Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Xiaofeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135604352","display_name":"Dongxu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Dongxu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135568297","display_name":"Jun Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135571876","display_name":"Zhichao Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Zhichao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135631233","display_name":"Davin Hill","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hill, Davin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103166669","display_name":"Tamer Soliman","orcid":"https://orcid.org/0009-0004-9292-3941"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Soliman, Tamer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042529162","display_name":"Sanjit Singh Batra","orcid":"https://orcid.org/0000-0001-9849-865X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Batra, Sanjit Singh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040732282","display_name":"R. Tillman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tillman, Robert","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135623021","display_name":"Guang Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Guang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.6037999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.6037999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.04280000180006027,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.03999999910593033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5746999979019165},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5598000288009644},{"id":"https://openalex.org/keywords/hallucinating","display_name":"Hallucinating","score":0.5406000018119812},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.44670000672340393},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.4260999858379364},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.3935000002384186},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.3905999958515167}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6794000267982483},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5746999979019165},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5598000288009644},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.5406000018119812},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.44670000672340393},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43309998512268066},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.4260999858379364},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.3935000002384186},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3912000060081482},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.3905999958515167},{"id":"https://openalex.org/C136525101","wikidata":"https://www.wikidata.org/wiki/Q5428139","display_name":"Fabrication","level":3,"score":0.36480000615119934},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.3456000089645386},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C69505689","wikidata":"https://www.wikidata.org/wiki/Q455338","display_name":"Unified Medical Language System","level":2,"score":0.3165999948978424},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.29019999504089355},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2590999901294708}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.04180","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04180","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.04180","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04180","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7682435512542725,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"exhibit":[3],"strong":[4],"reasoning":[5],"and":[6,54,57,75,81,109,111,148],"semantic":[7],"understanding":[8],"capabilities":[9],"but":[10],"often":[11],"hallucinate":[12],"in":[13,34,90],"domains":[14],"that":[15,78,123],"require":[16],"expert":[17],"knowledge,":[18],"among":[19],"which":[20],"fabrications,":[21],"the":[22,31],"generation":[23],"of":[24],"factually":[25],"incorrect":[26],"yet":[27],"fluent":[28],"statements,":[29],"pose":[30],"greatest":[32],"risk":[33],"medical":[35,38],"contexts.":[36],"Existing":[37],"hallucination":[39],"datasets":[40],"inadequately":[41],"capture":[42],"fabrication":[43,48,102,133],"phenomena":[44],"due":[45],"to":[46,72,116],"limited":[47],"coverage,":[49],"stylistic":[50,82],"disparities":[51],"between":[52],"human":[53],"LLM-authored":[55],"texts,":[56],"distributional":[58],"drift":[59],"during":[60],"hallucinated":[61],"sample":[62],"synthesis.":[63],"To":[64],"address":[65],"this,":[66],"we":[67,96],"propose":[68],"a":[69,99,143],"data-centric":[70],"pipeline":[71],"generate":[73],"realistic":[74],"word-level":[76,101,132],"fabrications":[77],"preserve":[79],"syntactic":[80],"fidelity":[83],"while":[84,135],"introducing":[85],"subtle":[86],"factual":[87,118],"deviations,":[88],"resulting":[89],"MedFabric.":[91],"Building":[92],"upon":[93],"this":[94],"dataset,":[95],"introduce":[97],"ETHER,":[98],"modular":[100],"detector":[103],"integrating":[104],"Text2Table":[105],"Decomposition,":[106],"Word":[107],"Masking":[108],"Filling":[110],"Hybrid":[112],"Sentence":[113],"Pair":[114],"Evaluation":[115],"enhance":[117],"alignment.":[119],"Empirical":[120],"results":[121],"demonstrate":[122],"MedFabric":[124],"outperforms":[125],"state-of-the-art":[126],"detectors":[127],"by":[128],"over":[129],"15%":[130],"on":[131],"benchmarks":[134],"maintaining":[136],"consistent":[137],"performance":[138],"across":[139],"structural":[140],"similarities,":[141],"offering":[142],"comprehensive":[144],"framework":[145],"for":[146],"reliable":[147],"domain-specific":[149],"factuality":[150],"detection.":[151]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-08T00:00:00"}
