{"id":"https://openalex.org/W7140312803","doi":"https://doi.org/10.48550/arxiv.2603.22954","title":"Privacy-Preserving EHR Data Transformation via Geometric Operators: A Human-AI Co-Design Technical Report","display_name":"Privacy-Preserving EHR Data Transformation via Geometric Operators: A Human-AI Co-Design Technical Report","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140312803","doi":"https://doi.org/10.48550/arxiv.2603.22954"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22954","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22954","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22954","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130575287","display_name":"Maolin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Maolin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130558070","display_name":"Beining Bao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bao, Beining","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130621125","display_name":"Gan Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Gan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130599898","display_name":"Hongyu Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hongyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130605793","display_name":"Bingkun Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Bingkun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130563499","display_name":"Baoshuo Kan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kan, Baoshuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130569335","display_name":"Jiming Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jiming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130561758","display_name":"Qi Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130599950","display_name":"Yinggong Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yinggong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130571419","display_name":"Yao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130553664","display_name":"Wei Ying Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Wei Ying","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130571766","display_name":"Jun Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.7483999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.7483999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.08179999887943268,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.02319999970495701,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.6197999715805054},{"id":"https://openalex.org/keywords/interoperability","display_name":"Interoperability","score":0.5365999937057495},{"id":"https://openalex.org/keywords/usable","display_name":"USable","score":0.5123999714851379},{"id":"https://openalex.org/keywords/data-transformation","display_name":"Data transformation","score":0.4244000017642975},{"id":"https://openalex.org/keywords/data-sharing","display_name":"Data sharing","score":0.41280001401901245},{"id":"https://openalex.org/keywords/data-anonymization","display_name":"Data anonymization","score":0.3978999853134155},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.38089999556541443},{"id":"https://openalex.org/keywords/cryptography","display_name":"Cryptography","score":0.3750999867916107},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.351500004529953}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7398999929428101},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.6197999715805054},{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.5365999937057495},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.5123999714851379},{"id":"https://openalex.org/C150670458","wikidata":"https://www.wikidata.org/wiki/Q4272815","display_name":"Data transformation","level":3,"score":0.4244000017642975},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.41280001401901245},{"id":"https://openalex.org/C2776945810","wikidata":"https://www.wikidata.org/wiki/Q17006654","display_name":"Data anonymization","level":3,"score":0.3978999853134155},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39649999141693115},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.38089999556541443},{"id":"https://openalex.org/C178489894","wikidata":"https://www.wikidata.org/wiki/Q8789","display_name":"Cryptography","level":2,"score":0.3750999867916107},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3537999987602234},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.351500004529953},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.34599998593330383},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.32679998874664307},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.30889999866485596},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.30799999833106995},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.30790001153945923},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3012999892234802},{"id":"https://openalex.org/C120894424","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory data analysis","level":2,"score":0.29649999737739563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28450000286102295},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28040000796318054},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.26989999413490295},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.26969999074935913},{"id":"https://openalex.org/C33884865","wikidata":"https://www.wikidata.org/wiki/Q1254335","display_name":"Cryptographic protocol","level":3,"score":0.2662999927997589},{"id":"https://openalex.org/C153876917","wikidata":"https://www.wikidata.org/wiki/Q899704","display_name":"Traceability","level":2,"score":0.2615000009536743},{"id":"https://openalex.org/C489000","wikidata":"https://www.wikidata.org/wiki/Q747385","display_name":"Data flow diagram","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.25850000977516174},{"id":"https://openalex.org/C71745522","wikidata":"https://www.wikidata.org/wiki/Q2476929","display_name":"Confidentiality","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C137314826","wikidata":"https://www.wikidata.org/wiki/Q2330408","display_name":"Data mapping","level":2,"score":0.25519999861717224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22954","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22954","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22954","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22954","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Electronic":[0],"health":[1],"records":[2],"(EHRs)":[3],"and":[4,17,29,45,55,75,96,110,143,161,170,209,218],"other":[5],"real-world":[6],"clinical":[7,12,124],"data":[8,36,84,129],"are":[9,190],"essential":[10],"for":[11,86,119,202],"research,":[13],"medical":[14,141],"artificial":[15],"intelligence,":[16],"life":[18],"science,":[19],"but":[20,62],"their":[21,99],"sharing":[22,121],"is":[23],"severely":[24],"limited":[25],"by":[26,206],"privacy,":[27],"governance,":[28],"interoperability":[30],"constraints.":[31],"These":[32],"barriers":[33],"create":[34],"persistent":[35],"silos":[37],"that":[38,103,139,189],"hinder":[39],"multi-center":[40],"studies,":[41],"large-scale":[42,72],"model":[43],"development,":[44],"broader":[46],"biomedical":[47],"discovery.":[48],"Existing":[49],"privacy-preserving":[50,120],"approaches,":[51],"including":[52],"multi-party":[53],"computation":[54,88],"related":[56],"cryptographic":[57],"techniques,":[58],"provide":[59],"strong":[60],"protection":[61],"often":[63],"introduce":[64],"substantial":[65],"computational":[66],"overhead,":[67],"reducing":[68],"the":[69,171],"efficiency":[70],"of":[71,122,127],"machine":[73],"learning":[74],"foundation-model":[76],"training.":[77],"In":[78],"addition,":[79],"many":[80],"such":[81],"methods":[82],"make":[83],"usable":[85],"restricted":[87],"while":[89],"leaving":[90],"them":[91],"effectively":[92],"invisible":[93],"to":[94],"clinicians":[95],"researchers,":[97],"limiting":[98],"value":[100],"in":[101],"workflows":[102],"still":[104],"require":[105],"direct":[106,156],"inspection,":[107],"exploratory":[108],"analysis,":[109],"human":[111,182],"interpretation.":[112],"We":[113],"propose":[114],"a":[115,149,177],"real-world-data":[116],"transformation":[117,187],"framework":[118],"structured":[123],"records.":[125],"Instead":[126],"converting":[128],"into":[130],"opaque":[131],"representations,":[132],"our":[133],"approach":[134],"constructs":[135],"transformed":[136],"numeric":[137],"views":[138,160],"preserve":[140],"semantics":[142],"major":[144],"statistical":[145],"properties":[146],"while,":[147],"under":[148,181,212],"clearly":[150],"specified":[151],"threat":[152,194],"model,":[153,195],"provably":[154],"breaking":[155],"linkage":[157],"between":[158,167],"those":[159],"protected":[162],"patient-level":[163],"attributes.":[164],"Through":[165],"collaboration":[166],"computer":[168],"scientists":[169],"AI":[172],"agent":[173],"\\textbf{SciencePal},":[174],"acting":[175],"as":[176],"constrained":[178],"tool":[179],"inventor":[180],"guidance,":[183],"we":[184],"design":[185],"three":[186],"operators":[188],"non-reversible":[191],"within":[192],"this":[193],"together":[196],"with":[197],"an":[198],"additional":[199],"mixing":[200],"strategy":[201],"high-risk":[203],"scenarios,":[204],"supported":[205],"theoretical":[207],"analysis":[208],"empirical":[210],"evaluation":[211],"reconstruction,":[213],"record":[214],"linkage,":[215],"membership":[216],"inference,":[217],"attribute":[219],"inference":[220],"attacks.":[221]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-26T00:00:00"}
