{"id":"https://openalex.org/W7126068000","doi":"https://doi.org/10.1109/bibm66473.2025.11356281","title":"MedKRG: A Knowledge and Retrieval-Guided Framework for Electronic Health Record Synthesis","display_name":"MedKRG: A Knowledge and Retrieval-Guided Framework for Electronic Health Record Synthesis","publication_year":2025,"publication_date":"2025-12-15","ids":{"openalex":"https://openalex.org/W7126068000","doi":"https://doi.org/10.1109/bibm66473.2025.11356281"},"language":null,"primary_location":{"id":"doi:10.1109/bibm66473.2025.11356281","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356281","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073837165","display_name":"Fengyu Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fengyu Lu","raw_affiliation_strings":["School of Business, Central South University,Changsha,China"],"affiliations":[{"raw_affiliation_string":"School of Business, Central South University,Changsha,China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124280891","display_name":"Jiaxin Duan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101356","display_name":"Beijing Founder Electronics (China)","ror":"https://ror.org/00nwrzz95","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210101356"]},{"id":"https://openalex.org/I4210159156","display_name":"System Equipment (China)","ror":"https://ror.org/04m2bcn74","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210159156"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxin Duan","raw_affiliation_strings":["China Electronics System Technology Co., Ltd,Research and Development Department,Beijing,China"],"affiliations":[{"raw_affiliation_string":"China Electronics System Technology Co., Ltd,Research and Development Department,Beijing,China","institution_ids":["https://openalex.org/I4210159156","https://openalex.org/I4210101356"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5073837165"],"corresponding_institution_ids":["https://openalex.org/I139660479"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.87377858,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2594","last_page":"2601"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.009700000286102295,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10350","display_name":"Electronic Health Records Systems","score":0.005200000014156103,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/health-records","display_name":"Health records","score":0.593500018119812},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5069000124931335},{"id":"https://openalex.org/keywords/electronic-health-record","display_name":"Electronic health record","score":0.46560001373291016},{"id":"https://openalex.org/keywords/meaningful-use","display_name":"Meaningful use","score":0.46459999680519104},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.44850000739097595},{"id":"https://openalex.org/keywords/medical-record","display_name":"Medical record","score":0.4156999886035919},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.39660000801086426},{"id":"https://openalex.org/keywords/scarcity","display_name":"Scarcity","score":0.39579999446868896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6682999730110168},{"id":"https://openalex.org/C3019952477","wikidata":"https://www.wikidata.org/wiki/Q1324077","display_name":"Health records","level":3,"score":0.593500018119812},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5069000124931335},{"id":"https://openalex.org/C3020144179","wikidata":"https://www.wikidata.org/wiki/Q10871684","display_name":"Electronic health record","level":3,"score":0.46560001373291016},{"id":"https://openalex.org/C3019659195","wikidata":"https://www.wikidata.org/wiki/Q5690566","display_name":"Meaningful use","level":3,"score":0.46459999680519104},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.44850000739097595},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.42250001430511475},{"id":"https://openalex.org/C195910791","wikidata":"https://www.wikidata.org/wiki/Q1324077","display_name":"Medical record","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.39660000801086426},{"id":"https://openalex.org/C109747225","wikidata":"https://www.wikidata.org/wiki/Q815758","display_name":"Scarcity","level":2,"score":0.39579999446868896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39579999446868896},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.38510000705718994},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3474999964237213},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33410000801086426},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32600000500679016},{"id":"https://openalex.org/C206497026","wikidata":"https://www.wikidata.org/wiki/Q1753883","display_name":"SNOMED CT","level":3,"score":0.31790000200271606},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.31369999051094055},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.303600013256073},{"id":"https://openalex.org/C45827449","wikidata":"https://www.wikidata.org/wiki/Q5270338","display_name":"Diagnosis code","level":3,"score":0.2831000089645386},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.2816999852657318},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C2780433410","wikidata":"https://www.wikidata.org/wiki/Q5276090","display_name":"Digital health","level":3,"score":0.25060001015663147},{"id":"https://openalex.org/C145642194","wikidata":"https://www.wikidata.org/wiki/Q870895","display_name":"Health informatics","level":3,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm66473.2025.11356281","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356281","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W4200481829","https://openalex.org/W4304192668","https://openalex.org/W4310852955","https://openalex.org/W4385573654","https://openalex.org/W4389520259","https://openalex.org/W4390607929","https://openalex.org/W4393156546","https://openalex.org/W4393160227","https://openalex.org/W4401043132","https://openalex.org/W4401100256","https://openalex.org/W4402683856","https://openalex.org/W4402684073","https://openalex.org/W4403577427","https://openalex.org/W4404781420","https://openalex.org/W4411119725","https://openalex.org/W4414360456"],"related_works":[],"abstract_inverted_index":{"Diagnosis":[0],"based":[1],"on":[2,109,173],"electronic":[3],"health":[4],"records":[5],"(EHRs)":[6],"often":[7,37],"struggles":[8],"with":[9,18,65],"data":[10,53,182],"scarcity":[11],"and":[12,51,80,83,113,141,151,183,197],"privacy":[13],"concerns,":[14],"particularly":[15],"when":[16],"dealing":[17],"rare":[19],"diseases.":[20],"Previous":[21],"approaches":[22],"using":[23,137],"artificial":[24],"intelligence":[25],"tools,":[26],"such":[27],"as":[28],"large":[29],"language":[30],"models":[31],"(LLMs),":[32],"to":[33,73,122,165,176],"generate":[34],"synthetic":[35,181],"EHRs":[36,64,71,129,157],"produce":[38],"factually":[39],"hallucinatory":[40],"content.":[41],"To":[42],"address":[43],"these":[44],"issues,":[45],"we":[46],"propose":[47],"MedKRG,":[48],"a":[49,74,94,104,114,124,138],"knowledge":[50,95,163],"retrieval-guided":[52],"synthesis":[54],"approach":[55],"that":[56],"augments":[57],"limited":[58],"EHR":[59,126],"samples.":[60],"Specifically,":[61,117],"MedKRG":[62],"creates":[63],"targeted":[66,167],"diseases":[67],"by":[68,131],"first":[69],"retrieving":[70],"similar":[72,128],"given":[75],"seed,":[76],"spanning":[77],"both":[78],"common":[79],"specific":[81],"conditions,":[82],"then":[84],"substituting":[85],"their":[86],"key":[87],"clinical":[88],"attributes":[89],"under":[90],"the":[91,134,155,162,166,178,184,201],"supervision":[92],"of":[93,100,161,180,186,203],"graph.":[96],"The":[97],"core":[98],"modules":[99],"our":[101],"framework":[102],"are":[103],"Transformer":[105],"encoder":[106],"(TE)":[107],"trained":[108],"diverse":[110],"medical":[111,139,198],"sources":[112],"powerful":[115],"LLM.":[116],"KeGES":[118],"uses":[119],"an":[120],"LLM":[121],"reconstruct":[123],"seed":[125],"from":[127],"retrieved":[130],"TE,":[132],"revisits":[133],"reconstructed":[135],"content":[136],"graph,":[140],"finally":[142],"produces":[143],"novel":[144],"EHRs.":[145],"This":[146],"loop":[147],"-":[148],"retrieval,":[149],"reconstruction,":[150],"revisiting":[152],"repeats":[153],"until":[154],"synthesized":[156],"achieve":[158],"comprehensive":[159,171],"coverage":[160],"related":[164],"disease.":[168],"We":[169],"perform":[170],"evaluations":[172],"Jarvis":[174],"datasets":[175],"assess":[177],"effectiveness":[179],"security":[185],"patient":[187,204],"privacy.":[188],"Experimental":[189],"results":[190],"demonstrate":[191],"improved":[192],"diagnostic":[193],"accuracy":[194],"across":[195],"generic":[196],"LLMs,":[199],"without":[200],"leakage":[202],"information.":[205]},"counts_by_year":[],"updated_date":"2026-02-01T03:34:12.195049","created_date":"2026-01-30T00:00:00"}
