{"id":"https://openalex.org/W4408355022","doi":"https://doi.org/10.1109/icassp49660.2025.10890338","title":"Emotion-Preserving Prosody Anonymization Network for Voice Privacy Protection","display_name":"Emotion-Preserving Prosody Anonymization Network for Voice Privacy Protection","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408355022","doi":"https://doi.org/10.1109/icassp49660.2025.10890338"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890338","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890338","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004010435","display_name":"Jiabei He","orcid":"https://orcid.org/0000-0003-1296-3675"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiabei He","raw_affiliation_strings":["Nankai Unversity,TMCC, College of Computer Science,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"Nankai Unversity,TMCC, College of Computer Science,Tianjin,China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052465353","display_name":"Shiwan Zhao","orcid":"https://orcid.org/0000-0001-5068-025X"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiwan Zhao","raw_affiliation_strings":["Nankai Unversity,TMCC, College of Computer Science,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"Nankai Unversity,TMCC, College of Computer Science,Tianjin,China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114859604","display_name":"Jiaming Zhou","orcid":"https://orcid.org/0009-0001-4760-9708"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaming Zhou","raw_affiliation_strings":["Nankai Unversity,TMCC, College of Computer Science,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"Nankai Unversity,TMCC, College of Computer Science,Tianjin,China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035524175","display_name":"Haoqin Sun","orcid":"https://orcid.org/0000-0002-8554-8969"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoqin Sun","raw_affiliation_strings":["Nankai Unversity,TMCC, College of Computer Science,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"Nankai Unversity,TMCC, College of Computer Science,Tianjin,China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100460850","display_name":"Hui Wang","orcid":"https://orcid.org/0000-0002-8814-1988"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Wang","raw_affiliation_strings":["Nankai Unversity,TMCC, College of Computer Science,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"Nankai Unversity,TMCC, College of Computer Science,Tianjin,China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088716214","display_name":"Yong Qin","orcid":"https://orcid.org/0000-0002-6519-8316"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Qin","raw_affiliation_strings":["Nankai Unversity,TMCC, College of Computer Science,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"Nankai Unversity,TMCC, College of Computer Science,Tianjin,China","institution_ids":["https://openalex.org/I205237279"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5004010435"],"corresponding_institution_ids":["https://openalex.org/I205237279"],"apc_list":null,"apc_paid":null,"fwci":4.3637,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.93384064,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9609000086784363,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9609000086784363,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7106382846832275},{"id":"https://openalex.org/keywords/privacy-protection","display_name":"Privacy protection","score":0.6663911938667297},{"id":"https://openalex.org/keywords/prosody","display_name":"Prosody","score":0.5480818152427673},{"id":"https://openalex.org/keywords/internet-privacy","display_name":"Internet privacy","score":0.4754825830459595},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.44168925285339355},{"id":"https://openalex.org/keywords/information-privacy","display_name":"Information privacy","score":0.4308244585990906},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.42426756024360657}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7106382846832275},{"id":"https://openalex.org/C3017597292","wikidata":"https://www.wikidata.org/wiki/Q25052250","display_name":"Privacy protection","level":2,"score":0.6663911938667297},{"id":"https://openalex.org/C542774811","wikidata":"https://www.wikidata.org/wiki/Q10880526","display_name":"Prosody","level":2,"score":0.5480818152427673},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.4754825830459595},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.44168925285339355},{"id":"https://openalex.org/C123201435","wikidata":"https://www.wikidata.org/wiki/Q456632","display_name":"Information privacy","level":2,"score":0.4308244585990906},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.42426756024360657}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890338","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890338","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.4699999988079071,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2146334809","https://openalex.org/W2202109488","https://openalex.org/W2593414223","https://openalex.org/W2785978752","https://openalex.org/W2889544410","https://openalex.org/W2962788625","https://openalex.org/W2963426391","https://openalex.org/W2972848589","https://openalex.org/W2995181338","https://openalex.org/W3010925296","https://openalex.org/W3024869864","https://openalex.org/W3096939667","https://openalex.org/W3160438760","https://openalex.org/W3167533889","https://openalex.org/W3197008493","https://openalex.org/W3209059054","https://openalex.org/W4372260248","https://openalex.org/W4375869316","https://openalex.org/W4386187689","https://openalex.org/W4392902635","https://openalex.org/W4392910591","https://openalex.org/W4406461271","https://openalex.org/W6687045409","https://openalex.org/W6780218876","https://openalex.org/W6796464841","https://openalex.org/W6848735303","https://openalex.org/W6855439139","https://openalex.org/W6862144568","https://openalex.org/W6863517579"],"related_works":["https://openalex.org/W2584827882","https://openalex.org/W3195097297","https://openalex.org/W3038106605","https://openalex.org/W2513267613","https://openalex.org/W3049084372","https://openalex.org/W2528109871","https://openalex.org/W2940702331","https://openalex.org/W2905822832","https://openalex.org/W4225340788","https://openalex.org/W4318485713"],"abstract_inverted_index":{"Balancing":[0],"emotion":[1,67],"preservation":[2],"and":[3,124,134],"privacy":[4,125],"protection":[5],"in":[6,25,31,131],"voice":[7,94],"anonymization":[8,84,114],"presents":[9],"a":[10,22,52,91],"significant":[11],"challenge,":[12],"particularly":[13],"due":[14],"to":[15,64,138],"the":[16,40,98,109,128,139],"difficulty":[17],"of":[18,42],"effectively":[19],"handling":[20],"prosody,":[21],"key":[23],"feature":[24],"speech.":[26],"While":[27],"preserving":[28],"prosodic":[29,62],"features":[30,63],"anonymized":[32],"speech":[33,66,87],"enhances":[34],"emotional":[35,120],"expression,":[36,121],"it":[37],"also":[38],"increases":[39],"risk":[41],"leaking":[43],"speaker":[44],"information.":[45],"To":[46],"address":[47],"this":[48],"conflict,":[49],"we":[50,89],"propose":[51],"lightweight":[53],"Emotion-Preserving":[54],"Prosody":[55],"Anonymization":[56],"(EPPA)":[57],"network,":[58],"which":[59],"extracts":[60],"speaker-independent":[61],"preserve":[65],"while":[68,85],"converting":[69],"them":[70],"into":[71],"another":[72],"speaker\u2019s":[73],"style":[74],"for":[75,83],"anonymization.":[76],"By":[77],"combining":[78],"EPPA":[79],"with":[80],"timbre":[81],"cloning":[82],"retaining":[86],"content,":[88],"achieve":[90],"more":[92],"balanced":[93],"conversion.":[95],"Evaluated":[96],"using":[97],"Voice":[99],"Privacy":[100],"Challenge":[101],"(VPC)":[102],"2024":[103],"metrics,":[104],"our":[105],"proposed":[106],"EPPA,":[107],"utilizing":[108],"closest":[110],"center":[111],"distance":[112],"(CCD)":[113],"strategy,":[115],"demonstrates":[116],"strong":[117],"performance":[118],"across":[119],"content":[122],"clarity,":[123],"protection,":[126],"achieving":[127],"highest":[129],"ranking":[130],"both":[132],"average":[133],"weighted":[135],"ranks":[136],"compared":[137],"six":[140],"baseline":[141],"solutions.":[142]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
