{"id":"https://openalex.org/W7148755413","doi":"https://doi.org/10.48550/arxiv.2604.01481","title":"DISCO-TAB: A Hierarchical Reinforcement Learning Framework for Privacy-Preserving Synthesis of Complex Clinical Data","display_name":"DISCO-TAB: A Hierarchical Reinforcement Learning Framework for Privacy-Preserving Synthesis of Complex Clinical Data","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148755413","doi":"https://doi.org/10.48550/arxiv.2604.01481"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01481","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01481","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01481","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132875800","display_name":"Arshia Ilaty","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ilaty, Arshia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132837766","display_name":"Hossein Shirazi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shirazi, Hossein","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132877876","display_name":"Amir Rahmani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahmani, Amir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5001028658","display_name":"Hajar Homayouni","orcid":"https://orcid.org/0000-0001-8898-9498"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Homayouni, Hajar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9107999801635742,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9107999801635742,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.020899999886751175,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.014499999582767487,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.5202999711036682},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5148000121116638},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.4846999943256378},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.43880000710487366},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.41749998927116394},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.37610000371932983},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.36340001225471497},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.3549000024795532}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6894999742507935},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5748999714851379},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5748000144958496},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.5202999711036682},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5148000121116638},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.4846999943256378},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.43880000710487366},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.41749998927116394},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.37610000371932983},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.36340001225471497},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3549000024795532},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.32109999656677246},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.2881999909877777},{"id":"https://openalex.org/C2780440489","wikidata":"https://www.wikidata.org/wiki/Q5227278","display_name":"Data-driven","level":2,"score":0.28630000352859497},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2782000005245209},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.26269999146461487},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.25540000200271606}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01481","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01481","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01481","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01481","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.6540537476539612,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"development":[1],"of":[2,14],"robust":[3,177],"clinical":[4,159],"decision":[5],"support":[6],"systems":[7],"is":[8],"frequently":[9],"impeded":[10],"by":[11],"the":[12,38],"scarcity":[13],"high-fidelity,":[15],"privacy-preserving":[16],"biomedical":[17],"data.":[18],"While":[19],"Generative":[20],"Large":[21],"Language":[22],"Models":[23],"(LLMs)":[24],"offer":[25],"a":[26,72,77,81,186],"promising":[27],"avenue":[28],"for":[29,69,189,196],"synthetic":[30,193],"data":[31,195],"generation,":[32],"they":[33],"often":[34],"struggle":[35],"to":[36,53,116,154,163,179],"capture":[37],"complex,":[39],"non-linear":[40],"dependencies":[41],"and":[42,105,112,122,165,176],"severe":[43],"class":[44],"imbalances":[45],"inherent":[46],"in":[47,157],"Electronic":[48],"Health":[49],"Records":[50],"(EHR),":[51],"leading":[52],"statistically":[54],"plausible":[55],"but":[56],"clinically":[57],"invalid":[58],"records.":[59],"To":[60],"bridge":[61],"this":[62],"gap,":[63],"we":[64],"introduce":[65],"DISCO-TAB":[66,96],"(DIScriminator-guided":[67],"COntrol":[68],"TABular":[70],"synthesis),":[71],"novel":[73],"framework":[74,130],"that":[75,146],"orchestrates":[76],"fine-tuned":[78],"LLM":[79],"with":[80],"multi-objective":[82],"discriminator":[83],"system":[84],"optimized":[85],"via":[86],"Reinforcement":[87],"Learning.":[88],"Unlike":[89],"prior":[90],"methods":[91],"relying":[92],"on":[93],"scalar":[94],"feedback,":[95],"evaluates":[97],"synthesis":[98],"at":[99],"four":[100],"granularities,":[101],"token,":[102],"sentence,":[103],"feature,":[104],"row,":[106],"while":[107,168],"integrating":[108],"Automated":[109],"Constraint":[110],"Discovery":[111],"Inverse-Frequency":[113],"Reward":[114],"Shaping":[115],"autonomously":[117],"preserve":[118],"latent":[119],"medical":[120,137],"logic":[121],"resolve":[123],"minority-class":[124],"collapse.":[125],"We":[126],"rigorously":[127],"validate":[128],"our":[129],"across":[131],"diverse":[132],"benchmarks,":[133],"including":[134],"high-dimensional,":[135],"small-sample":[136],"datasets":[138],"(e.g.,":[139],"Heart":[140],"Failure,":[141],"Parkinson's).":[142],"Our":[143],"results":[144],"demonstrate":[145],"hierarchical":[147],"feedback":[148],"yields":[149],"state-of-the-art":[150],"performance,":[151],"achieving":[152],"up":[153],"38.2%":[155],"improvement":[156],"downstream":[158],"classifier":[160],"utility":[161],"compared":[162],"GAN":[164],"Diffusion":[166],"baselines,":[167],"ensuring":[169],"exceptional":[170],"statistical":[171],"fidelity":[172],"(JSD":[173],"&lt;":[174],"0.01)":[175],"resistance":[178],"membership":[180],"inference":[181],"attacks.":[182],"This":[183],"work":[184],"establishes":[185],"new":[187],"standard":[188],"generating":[190],"trustworthy,":[191],"utility-preserving":[192],"tabular":[194],"sensitive":[197],"healthcare":[198],"applications.":[199]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-04T00:00:00"}
