{"id":"https://openalex.org/W2989483391","doi":"https://doi.org/10.26615/978-954-452-056-4_030","title":"De-Identification of Emails: Pseudonymizing Privacy-Sensitive Data in a German Email Corpus","display_name":"De-Identification of Emails: Pseudonymizing Privacy-Sensitive Data in a German Email Corpus","publication_year":2019,"publication_date":"2019-10-22","ids":{"openalex":"https://openalex.org/W2989483391","doi":"https://doi.org/10.26615/978-954-452-056-4_030","mag":"2989483391"},"language":"en","primary_location":{"id":"doi:10.26615/978-954-452-056-4_030","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-056-4_030","pdf_url":"https://doi.org/10.26615/978-954-452-056-4_030","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings - Natural Language Processing in a Deep Learning World","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.26615/978-954-452-056-4_030","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Institut f\u00fcr Germanistik, Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria","orcid":null},"institutions":[{"id":"https://openalex.org/I4210166741","display_name":"University of Klagenfurt","ror":"https://ror.org/05q9m0937","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210166741"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Institut f\u00fcr Germanistik, Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria","raw_affiliation_strings":["Institut f\u00fcr Germanistik Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria"],"affiliations":[{"raw_affiliation_string":"Institut f\u00fcr Germanistik Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria","institution_ids":["https://openalex.org/I4210166741"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066646882","display_name":"Elisabeth Eder","orcid":null},"institutions":[{"id":"https://openalex.org/I4210166741","display_name":"University of Klagenfurt","ror":"https://ror.org/05q9m0937","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210166741"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Elisabeth Eder","raw_affiliation_strings":["Institut fr Germanistik Alpen-Adria-Universitt Klagenfurt, Klagenfurt, Austria","Institut f\u00fcr Germanistik Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria"],"affiliations":[{"raw_affiliation_string":"Institut fr Germanistik Alpen-Adria-Universitt Klagenfurt, Klagenfurt, Austria","institution_ids":["https://openalex.org/I4210166741"]},{"raw_affiliation_string":"Institut f\u00fcr Germanistik Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria","institution_ids":["https://openalex.org/I4210166741"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052797822","display_name":"Ulrike Krieg-Holz","orcid":null},"institutions":[{"id":"https://openalex.org/I4210166741","display_name":"University of Klagenfurt","ror":"https://ror.org/05q9m0937","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210166741"]},{"id":"https://openalex.org/I76198965","display_name":"Friedrich Schiller University Jena","ror":"https://ror.org/05qpz1x62","country_code":"DE","type":"education","lineage":["https://openalex.org/I76198965"]}],"countries":["AT","DE"],"is_corresponding":true,"raw_author_name":"Ulrike Krieg-Holz","raw_affiliation_strings":["Institut fr Germanistik Alpen-Adria-Universitt Klagenfurt, Klagenfurt, Austria","Jena University Language & Information Engineering (JULIE) Lab Friedrich-Schiller-Universit\u00e4t Jena, Jena, Germany"],"affiliations":[{"raw_affiliation_string":"Institut fr Germanistik Alpen-Adria-Universitt Klagenfurt, Klagenfurt, Austria","institution_ids":["https://openalex.org/I4210166741"]},{"raw_affiliation_string":"Jena University Language & Information Engineering (JULIE) Lab Friedrich-Schiller-Universit\u00e4t Jena, Jena, Germany","institution_ids":["https://openalex.org/I76198965"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Institut f\u00fcr Germanistik, Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Institut f\u00fcr Germanistik, Alpen-Adria-Universit\u00e4t Klagenfurt, Klagenfurt, Austria","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5044841280","display_name":"Udo Hahn","orcid":"https://orcid.org/0000-0002-5052-0245"},"institutions":[{"id":"https://openalex.org/I76198965","display_name":"Friedrich Schiller University Jena","ror":"https://ror.org/05qpz1x62","country_code":"DE","type":"education","lineage":["https://openalex.org/I76198965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Udo Hahn","raw_affiliation_strings":["Jena University Language & Information Engineering (JULIE) Lab Friedrich-Schiller-Universitt Jena, Jena, Germany"],"affiliations":[{"raw_affiliation_string":"Jena University Language & Information Engineering (JULIE) Lab Friedrich-Schiller-Universitt Jena, Jena, Germany","institution_ids":["https://openalex.org/I76198965"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052797822"],"corresponding_institution_ids":["https://openalex.org/I4210166741","https://openalex.org/I76198965"],"apc_list":null,"apc_paid":null,"fwci":1.1576,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.84753419,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"259","last_page":"269"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11800","display_name":"User Authentication and Security Systems","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/german","display_name":"German","score":0.8500118255615234},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7455228567123413},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.7007524371147156},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6530886292457581},{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.6270990371704102},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4196198582649231},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.40311357378959656},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3638682961463928},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3410422205924988},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1067514717578888},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08174866437911987}],"concepts":[{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.8500118255615234},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7455228567123413},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.7007524371147156},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6530886292457581},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.6270990371704102},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4196198582649231},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.40311357378959656},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3638682961463928},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3410422205924988},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1067514717578888},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08174866437911987},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.26615/978-954-452-056-4_030","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-056-4_030","pdf_url":"https://doi.org/10.26615/978-954-452-056-4_030","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings - Natural Language Processing in a Deep Learning World","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.26615/978-954-452-056-4_030","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-056-4_030","pdf_url":"https://doi.org/10.26615/978-954-452-056-4_030","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings - Natural Language Processing in a Deep Learning World","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.6700000166893005}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2989483391.pdf","grobid_xml":"https://content.openalex.org/works/W2989483391.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W8550301","https://openalex.org/W93415635","https://openalex.org/W128054572","https://openalex.org/W1034374084","https://openalex.org/W1262131959","https://openalex.org/W1603920809","https://openalex.org/W1836961878","https://openalex.org/W1966343454","https://openalex.org/W2053154970","https://openalex.org/W2115792042","https://openalex.org/W2137377614","https://openalex.org/W2155652813","https://openalex.org/W2159024459","https://openalex.org/W2160987310","https://openalex.org/W2166443682","https://openalex.org/W2190333735","https://openalex.org/W2268112550","https://openalex.org/W2294303695","https://openalex.org/W2295265695","https://openalex.org/W2517394750","https://openalex.org/W2578865663","https://openalex.org/W2621075239","https://openalex.org/W2624380710","https://openalex.org/W2758480492","https://openalex.org/W2889507104","https://openalex.org/W2893405045","https://openalex.org/W2950551677","https://openalex.org/W2963879260","https://openalex.org/W2963956191","https://openalex.org/W2964217136","https://openalex.org/W2991314401","https://openalex.org/W3099138433","https://openalex.org/W3122733836"],"related_works":["https://openalex.org/W2315527029","https://openalex.org/W2065387230","https://openalex.org/W2323937687","https://openalex.org/W648995381","https://openalex.org/W3033791384","https://openalex.org/W2141885522","https://openalex.org/W2776312268","https://openalex.org/W4246315097","https://openalex.org/W346029495","https://openalex.org/W1201259214"],"abstract_inverted_index":{"We":[0,67],"deal":[1],"with":[2],"the":[3],"pseudonymization":[4],"of":[5,8,35],"those":[6],"stretches":[7],"text":[9],"in":[10],"emails":[11],"that":[12],"might":[13],"allow":[14],"to":[15],"identify":[16],"real":[17],"individual":[18],"persons.":[19],"This":[20],"task":[21],"is":[22,62],"decomposed":[23],"into":[24],"two":[25],"steps.":[26],"First,":[27],"named":[28,59],"entities":[29,48],"carrying":[30],"privacysensitive":[31],"information":[32],"(e.g.,":[33,55],"names":[34],"persons,":[36],"locations,":[37],"phone":[38],"numbers":[39],"or":[40],"dates)":[41],"are":[42,49],"identified,":[43],"and,":[44],"second,":[45],"these":[46],"privacybearing":[47],"replaced":[50],"by":[51],"synthetically":[52],"generated":[53],"surrogates":[54],"a":[56,69,81],"person":[57],"originally":[58],"'John":[60],"Doe'":[61],"renamed":[63],"as":[64],"'Bill":[65],"Powers').":[66],"describe":[68],"system":[70],"architecture":[71],"for":[72],"surrogate":[73],"generation":[74],"and":[75],"evaluate":[76],"our":[77],"approach":[78],"on":[79],"CODEALLTAG,":[80],"German":[82],"email":[83],"corpus.":[84]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":6},{"year":2019,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2019-11-22T00:00:00"}
