{"id":"https://openalex.org/W4406458720","doi":"https://doi.org/10.1109/bigdata62323.2024.10825249","title":"Private Synthetic Data Generation for Mixed Type Datasets","display_name":"Private Synthetic Data Generation for Mixed Type Datasets","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406458720","doi":"https://doi.org/10.1109/bigdata62323.2024.10825249"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825249","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825249","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045662127","display_name":"Irene Tenison","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Irene Tenison","raw_affiliation_strings":["Massachusetts Institute of Technology,Cambridge,MA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Cambridge,MA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070627277","display_name":"A. I. Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ashley Chen","raw_affiliation_strings":["Massachusetts Institute of Technology,Cambridge,MA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Cambridge,MA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115904554","display_name":"Navpreet Singh","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Navpreet Singh","raw_affiliation_strings":["Massachusetts Institute of Technology,Cambridge,MA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Cambridge,MA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115904555","display_name":"Omar Dahleh","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Omar Dahleh","raw_affiliation_strings":["Massachusetts Institute of Technology,Cambridge,MA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Cambridge,MA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092579780","display_name":"Eliott Zemour","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eliott Zemour","raw_affiliation_strings":["Massachusetts Institute of Technology,Cambridge,MA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Cambridge,MA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013709154","display_name":"Lalana Kagal","orcid":"https://orcid.org/0000-0001-8469-1993"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lalana Kagal","raw_affiliation_strings":["Massachusetts Institute of Technology,Cambridge,MA"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology,Cambridge,MA","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5045662127"],"corresponding_institution_ids":["https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":0.3626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.70782466,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"6379","last_page":"6386"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9197999835014343,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6079505085945129},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4484640061855316},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.435497522354126},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23050272464752197},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12419801950454712}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6079505085945129},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4484640061855316},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.435497522354126},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23050272464752197},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12419801950454712}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825249","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825249","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.44999998807907104}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W128638292","https://openalex.org/W1873763122","https://openalex.org/W2154652894","https://openalex.org/W2473418344","https://openalex.org/W2752442988","https://openalex.org/W2789028076","https://openalex.org/W2806276686","https://openalex.org/W2946930197","https://openalex.org/W2950397305","https://openalex.org/W2963091658","https://openalex.org/W2963541420","https://openalex.org/W2963592583","https://openalex.org/W2998378988","https://openalex.org/W3096831136","https://openalex.org/W3123788974","https://openalex.org/W3157988161","https://openalex.org/W3163824215","https://openalex.org/W3173004511","https://openalex.org/W3178949368","https://openalex.org/W3193647133","https://openalex.org/W4254943607","https://openalex.org/W4283172211","https://openalex.org/W4283805899","https://openalex.org/W4283816219","https://openalex.org/W4287888099","https://openalex.org/W4288089799","https://openalex.org/W4288296172","https://openalex.org/W4298166788","https://openalex.org/W4317940312","https://openalex.org/W4318147773","https://openalex.org/W4318596157","https://openalex.org/W4378465287","https://openalex.org/W4378505437","https://openalex.org/W4383469362","https://openalex.org/W4384918448","https://openalex.org/W4385569941","https://openalex.org/W4385571534","https://openalex.org/W4385573108","https://openalex.org/W4387596201","https://openalex.org/W6682631176","https://openalex.org/W6745910440","https://openalex.org/W6747047132","https://openalex.org/W6763393573","https://openalex.org/W6765451912","https://openalex.org/W6769627184","https://openalex.org/W6797936153","https://openalex.org/W6799631579","https://openalex.org/W6801292351","https://openalex.org/W6802709103","https://openalex.org/W6839294834","https://openalex.org/W6839820251","https://openalex.org/W6846546667","https://openalex.org/W6847333945","https://openalex.org/W6849005259","https://openalex.org/W6853608320","https://openalex.org/W6853794594","https://openalex.org/W6854866820","https://openalex.org/W6857318322","https://openalex.org/W6898505805"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W3109499659","https://openalex.org/W4382315317","https://openalex.org/W2966641257","https://openalex.org/W4399530423"],"abstract_inverted_index":{"In":[0],"the":[1,43,50,111,182],"face":[2],"of":[3,87,113,115,211],"escalating":[4],"threats":[5],"from":[6,82],"privacy":[7,55],"attacks":[8],"on":[9,122,221],"machine":[10],"learning":[11],"models,":[12],"we":[13],"propose":[14],"a":[15,73,139,208],"system":[16,121,161],"that":[17,22,61,85,159,167,219],"can":[18,101,186],"artificially":[19],"generate":[20],"data":[21,25,68,99,185,190,200],"imitates":[23],"real":[24],"but":[26,53],"doesn\u2019t":[27],"contain":[28],"any":[29],"sensitive":[30,116,222],"or":[31,66,91],"personally":[32],"identifiable":[33],"information.":[34],"The":[35,96],"generated":[36,100,183],"data,":[37,40],"called":[38],"synthetic":[39,80,98,165,184],"will":[41],"have":[42],"same":[44],"semantic":[45],"and":[46,93,106,125,129,135,147,193,204,216],"statistical":[47],"distribution":[48],"as":[49,175,177],"original":[51],"dataset":[52],"provide":[54],"guarantees.":[56],"Compared":[57],"to":[58,143,153,195,199],"previous":[59],"works":[60],"dealt":[62],"with":[63,151],"either":[64],"structured":[65,89],"unstructured":[67,94],"separately,":[69],"our":[70,120,160],"work":[71],"develops":[72],"complete":[74],"hybrid":[75],"pipeline":[76],"for":[77,132],"generating":[78],"private":[79,97,164],"datasets":[81,84,128,166],"complex":[83],"consist":[86],"both":[88,133],"(numerical":[90],"categorical)":[92],"data.":[95,117,223],"be":[102,187],"analyzed":[103],"by":[104,189],"collaborators":[105],"third":[107],"parties":[108],"without":[109],"increasing":[110],"risks":[112],"leakage":[114],"We":[118,137],"evaluate":[119,154],"Yelp":[123],"reviews":[124],"drug":[126],"side-effects":[127],"calculate":[130],"metrics":[131],"quality":[134],"privacy.":[136,155,178],"introduce":[138],"context-aware":[140],"exposure":[141,152],"metric":[142],"quantify":[144],"context-dependent":[145],"memorization":[146],"use":[148],"it":[149],"along":[150],"Our":[156],"evaluations":[157],"demonstrate":[158],"generates":[162],"meaningful":[163],"achieve":[168],"good":[169],"performance":[170],"in":[171,207],"characteristic":[172],"similarity,":[173],"utility,":[174],"well":[176],"Given":[179],"these":[180],"results,":[181],"used":[188],"scientists,":[191],"researchers,":[192],"developers":[194],"address":[196],"challenges":[197],"related":[198],"privacy,":[201],"scarcity,":[202],"diversity,":[203],"model":[205],"testing":[206],"wide":[209],"range":[210],"applications":[212],"including":[213],"healthcare,":[214],"insurance,":[215],"financial":[217],"systems":[218],"rely":[220]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
