{"id":"https://openalex.org/W4417101185","doi":"https://doi.org/10.48550/arxiv.2508.01889","title":"Medical Image De-Identification Resources: Synthetic DICOM Data and Tools for Validation","display_name":"Medical Image De-Identification Resources: Synthetic DICOM Data and Tools for Validation","publication_year":2025,"publication_date":"2025-08-03","ids":{"openalex":"https://openalex.org/W4417101185","doi":"https://doi.org/10.48550/arxiv.2508.01889"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2508.01889","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.01889","pdf_url":"https://arxiv.org/pdf/2508.01889","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.01889","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070764516","display_name":"Michael Rutherford","orcid":"https://orcid.org/0000-0003-2665-753X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rutherford, Michael W.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031611715","display_name":"Tracy S. Nolan","orcid":"https://orcid.org/0000-0002-7023-7586"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nolan, Tracy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045820623","display_name":"Linmin Pei","orcid":"https://orcid.org/0000-0001-6135-9429"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pei, Linmin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045002278","display_name":"Ulrike Wagner","orcid":"https://orcid.org/0000-0002-3230-5058"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wagner, Ulrike","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100871247","display_name":"Qinyan Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Qinyan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001424327","display_name":"Phillip Farmer","orcid":"https://orcid.org/0000-0003-1448-1346"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farmer, Phillip","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027374679","display_name":"Kirk Smith","orcid":"https://orcid.org/0000-0002-8735-7576"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Smith, Kirk","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036757105","display_name":"Benjamin Kopchick","orcid":"https://orcid.org/0000-0003-1125-0155"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kopchick, Benjamin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066723497","display_name":"Laura Opsahl-Ong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Opsahl-Ong, Laura","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028284504","display_name":"Granger Sutton","orcid":"https://orcid.org/0000-0001-7498-8048"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sutton, Granger","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013106687","display_name":"David Clunie","orcid":"https://orcid.org/0000-0002-2406-1145"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Clunie, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030981069","display_name":"Keyvan Farahani","orcid":"https://orcid.org/0000-0003-2111-1896"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farahani, Keyvan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5063662396","display_name":"Fred Prior","orcid":"https://orcid.org/0000-0002-6314-5683"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Prior, Fred","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5070764516"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12422","display_name":"Radiomics and Machine Learning in Medical Imaging","score":0.23170000314712524,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T12422","display_name":"Radiomics and Machine Learning in Medical Imaging","score":0.23170000314712524,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.18119999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11361","display_name":"Digital Radiography and Breast Imaging","score":0.12330000102519989,"subfield":{"id":"https://openalex.org/subfields/2740","display_name":"Pulmonary and Respiratory Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dicom","display_name":"DICOM","score":0.9478999972343445},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.6164000034332275},{"id":"https://openalex.org/keywords/confidentiality","display_name":"Confidentiality","score":0.49729999899864197},{"id":"https://openalex.org/keywords/data-sharing","display_name":"Data sharing","score":0.4781000018119812},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.3937000036239624},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.37940001487731934},{"id":"https://openalex.org/keywords/data-integrity","display_name":"Data integrity","score":0.362199991941452},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.3569999933242798},{"id":"https://openalex.org/keywords/image-file-formats","display_name":"Image file formats","score":0.3443000018596649}],"concepts":[{"id":"https://openalex.org/C77331912","wikidata":"https://www.wikidata.org/wiki/Q81095","display_name":"DICOM","level":2,"score":0.9478999972343445},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.683899998664856},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.6164000034332275},{"id":"https://openalex.org/C71745522","wikidata":"https://www.wikidata.org/wiki/Q2476929","display_name":"Confidentiality","level":2,"score":0.49729999899864197},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.4781000018119812},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4065999984741211},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.3937000036239624},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.37940001487731934},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.362199991941452},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3569999933242798},{"id":"https://openalex.org/C65377053","wikidata":"https://www.wikidata.org/wiki/Q1572121","display_name":"Image file formats","level":3,"score":0.3443000018596649},{"id":"https://openalex.org/C112416745","wikidata":"https://www.wikidata.org/wiki/Q974213","display_name":"Digital imaging","level":5,"score":0.3425000011920929},{"id":"https://openalex.org/C123201435","wikidata":"https://www.wikidata.org/wiki/Q456632","display_name":"Information privacy","level":2,"score":0.3230000138282776},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3215999901294708},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.3125},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.31200000643730164},{"id":"https://openalex.org/C42781572","wikidata":"https://www.wikidata.org/wiki/Q1250322","display_name":"Digital image","level":4,"score":0.30079999566078186},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C91632574","wikidata":"https://www.wikidata.org/wiki/Q15088675","display_name":"Data curation","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C69360830","wikidata":"https://www.wikidata.org/wiki/Q1172237","display_name":"Data Protection Act 1998","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C163763905","wikidata":"https://www.wikidata.org/wiki/Q17075943","display_name":"Precision medicine","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C92446256","wikidata":"https://www.wikidata.org/wiki/Q3306762","display_name":"Data validation","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C2987933465","wikidata":"https://www.wikidata.org/wiki/Q141130","display_name":"Image manipulation","level":3,"score":0.25859999656677246},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C2778306010","wikidata":"https://www.wikidata.org/wiki/Q606563","display_name":"Health Insurance Portability and Accountability Act","level":3,"score":0.25360000133514404},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.25209999084472656}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2508.01889","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.01889","pdf_url":"https://arxiv.org/pdf/2508.01889","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2508.01889","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.01889","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.01889","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.01889","pdf_url":"https://arxiv.org/pdf/2508.01889","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Medical":[0,118],"imaging":[1,159],"research":[2],"increasingly":[3],"depends":[4],"on":[5,85],"large-scale":[6],"data":[7,27,39,129,172,176,180,211],"sharing":[8],"to":[9,74,181],"promote":[10],"reproducibility":[11,89],"and":[12,31,49,55,68,82,90,108,150,161,166,178,202,231,245],"train":[13],"Artificial":[14],"Intelligence":[15],"(AI)":[16],"models.":[17],"Ensuring":[18],"patient":[19],"privacy":[20],"remains":[21],"a":[22,195],"significant":[23],"challenge":[24],"for":[25,41,112,141,144],"open-access":[26],"sharing.":[28,250],"Digital":[29],"Imaging":[30,133],"Communications":[32],"in":[33],"Medicine":[34],"(DICOM),":[35],"the":[36,220],"global":[37],"standard":[38],"format":[40],"medical":[42,248],"imaging,":[43],"encodes":[44],"both":[45],"essential":[46],"clinical":[47],"metadata":[48],"extensive":[50],"protected":[51],"health":[52],"information":[53,58],"(PHI)":[54],"personally":[56],"identifiable":[57],"(PII).":[59],"Effective":[60],"de-identification":[61,115,120,241],"must":[62],"remove":[63],"identifiers,":[64],"preserve":[65],"scientific":[66],"utility,":[67],"maintain":[69],"DICOM":[70,102,152,227],"validity.":[71],"Tools":[72],"exist":[73],"perform":[75],"de-identification,":[76],"but":[77],"few":[78],"assess":[79],"its":[80],"effectiveness,":[81],"most":[83],"rely":[84],"subjective":[86],"reviews,":[87],"limiting":[88],"regulatory":[91],"confidence.":[92],"To":[93],"address":[94],"this":[95],"gap,":[96],"we":[97],"developed":[98],"an":[99,109],"openly":[100],"accessible":[101],"dataset":[103,122],"infused":[104],"with":[105,219],"synthetic":[106],"PHI/PII":[107],"evaluation":[110,192,239],"framework":[111,216],"benchmarking":[113],"image":[114,153,249],"workflows.":[116],"The":[117,131,215],"Image":[119],"(MIDI)":[121],"was":[123],"built":[124],"using":[125],"publicly":[126],"available":[127],"de-identified":[128],"from":[130],"Cancer":[132],"Archive":[134],"(TCIA).":[135],"It":[136,235],"includes":[137],"538":[138],"subjects":[139],"(216":[140],"validation,":[142],"322":[143],"testing),":[145],"605":[146],"studies,":[147],"708":[148],"series,":[149],"53,581":[151],"instances.":[154],"These":[155],"span":[156],"multiple":[157],"vendors,":[158],"modalities,":[160],"cancer":[162],"types.":[163],"Synthetic":[164],"PHI":[165],"PII":[167],"were":[168],"embedded":[169],"into":[170],"structured":[171],"elements,":[173,177],"plain":[174],"text":[175],"pixel":[179],"simulate":[182],"real-world":[183],"identity":[184],"leaks":[185],"encountered":[186],"by":[187],"TCIA":[188,232],"curation":[189],"teams.":[190],"Accompanying":[191],"tools":[193],"include":[194],"Python":[196],"script,":[197],"answer":[198],"keys":[199],"(known":[200],"truth),":[201],"mapping":[203],"files":[204],"that":[205],"enable":[206],"automated":[207],"comparison":[208],"of":[209,240],"curated":[210],"against":[212],"expected":[213],"transformations.":[214],"is":[217],"aligned":[218],"HIPAA":[221],"Privacy":[222],"Rule":[223],"\"Safe":[224],"Harbor\"":[225],"method,":[226],"PS3.15":[228],"Confidentiality":[229],"Profiles,":[230],"best":[233],"practices.":[234],"supports":[236],"objective,":[237],"standards-driven":[238],"workflows,":[242],"promoting":[243],"safer":[244],"more":[246],"consistent":[247]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
