{"id":"https://openalex.org/W7134113222","doi":"https://doi.org/10.1109/tifs.2026.3671687","title":"DUAP: Disentanglement-Based Universal Adversarial Perturbations for Robust Multilingual Speech Privacy Protection","display_name":"DUAP: Disentanglement-Based Universal Adversarial Perturbations for Robust Multilingual Speech Privacy Protection","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7134113222","doi":"https://doi.org/10.1109/tifs.2026.3671687"},"language":null,"primary_location":{"id":"doi:10.1109/tifs.2026.3671687","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tifs.2026.3671687","pdf_url":null,"source":{"id":"https://openalex.org/S61310614","display_name":"IEEE Transactions on Information Forensics and Security","issn_l":"1556-6013","issn":["1556-6013","1556-6021"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Information Forensics and Security","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121072862","display_name":"Q. M. Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qianli Ma","raw_affiliation_strings":["College of Information Science and Engineering, Ningbo University, Ningbo, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ningbo University, Ningbo, China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128300679","display_name":"Wenjie Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjie Zhang","raw_affiliation_strings":["College of Information Science and Engineering, Ningbo University, Ningbo, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ningbo University, Ningbo, China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiahao Chen","orcid":"https://orcid.org/0000-0002-5894-662X"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiahao Chen","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114972002","display_name":"Jiazhen Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiazhen Jia","raw_affiliation_strings":["College of Information Science and Engineering, Ningbo University, Ningbo, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ningbo University, Ningbo, China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Rangding Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rangding Wang","raw_affiliation_strings":["College of Digital Technology and Engineering, Ningbo University of Finance and Economics, Ningbo, China"],"affiliations":[{"raw_affiliation_string":"College of Digital Technology and Engineering, Ningbo University of Finance and Economics, Ningbo, China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016795475","display_name":"Diqun Yan","orcid":"https://orcid.org/0000-0002-5241-7276"},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Diqun Yan","raw_affiliation_strings":["College of Information Science and Engineering, Ningbo University, Ningbo, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ningbo University, Ningbo, China","institution_ids":["https://openalex.org/I109935558"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5121072862"],"corresponding_institution_ids":["https://openalex.org/I109935558"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.54681067,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"21","issue":null,"first_page":"3703","last_page":"3718"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9049999713897705,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9049999713897705,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.025800000876188278,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.025299999862909317,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.8812999725341797},{"id":"https://openalex.org/keywords/transferability","display_name":"Transferability","score":0.6553999781608582},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.5144000053405762},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.428600013256073},{"id":"https://openalex.org/keywords/language-identification","display_name":"Language identification","score":0.39149999618530273},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.32510000467300415},{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.31929999589920044},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.31850001215934753}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.8812999725341797},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8650000095367432},{"id":"https://openalex.org/C61272859","wikidata":"https://www.wikidata.org/wiki/Q7834031","display_name":"Transferability","level":3,"score":0.6553999781608582},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.5144000053405762},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4706000089645386},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.46630001068115234},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4372999966144562},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.428600013256073},{"id":"https://openalex.org/C129792486","wikidata":"https://www.wikidata.org/wiki/Q1050419","display_name":"Language identification","level":3,"score":0.39149999618530273},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.32510000467300415},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.31929999589920044},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.31779998540878296},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C3017597292","wikidata":"https://www.wikidata.org/wiki/Q25052250","display_name":"Privacy protection","level":2,"score":0.31130000948905945},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3093000054359436},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.3077000081539154},{"id":"https://openalex.org/C2780035574","wikidata":"https://www.wikidata.org/wiki/Q30081","display_name":"Multilingualism","level":2,"score":0.3028999865055084},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2775999903678894},{"id":"https://openalex.org/C184297639","wikidata":"https://www.wikidata.org/wiki/Q177765","display_name":"Biometrics","level":2,"score":0.2669000029563904},{"id":"https://openalex.org/C153025619","wikidata":"https://www.wikidata.org/wiki/Q1051241","display_name":"Public address system","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tifs.2026.3671687","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tifs.2026.3671687","pdf_url":null,"source":{"id":"https://openalex.org/S61310614","display_name":"IEEE Transactions on Information Forensics and Security","issn_l":"1556-6013","issn":["1556-6013","1556-6021"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Information Forensics and Security","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.5107393264770508}],"awards":[{"id":"https://openalex.org/G2871147967","display_name":null,"funder_award_id":"62571283","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2873729387","display_name":null,"funder_award_id":"2024Z128","funder_id":"https://openalex.org/F4320336552","funder_display_name":"Science and Technology Innovation 2025 Major Project of Ningbo"},{"id":"https://openalex.org/G697824810","display_name":null,"funder_award_id":"62171244","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336552","display_name":"Science and Technology Innovation 2025 Major Project of Ningbo","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,152],"rapid":[1],"advancement":[2],"of":[3],"automatic":[4],"speech":[5,21,43],"recognition":[6,44],"(ASR)":[7],"models":[8],"has":[9],"significantly":[10],"bolstered":[11],"their":[12,79,94],"multilingual":[13,42,63,82,150],"proficiency":[14],"and":[15,33,144,166,191,219,231],"robustness,":[16],"amplifying":[17],"concerns":[18],"over":[19,213],"user":[20,36],"privacy.":[22],"Attackers":[23],"may":[24],"use":[25],"hidden":[26],"microphones":[27],"or":[28],"network":[29],"attacks":[30],"to":[31,62,96,117,133,170,180,200],"capture":[32],"transcribe":[34],"sensitive":[35],"interactions.":[37],"Whisper,":[38],"a":[39,113,155,160],"state-of-the-art":[40],"(SOTA)":[41],"model,":[45],"delivers":[46],"exceptional":[47],"transcription":[48],"accuracy":[49],"across":[50,141],"diverse":[51],"languages.":[52],"However,":[53],"its":[54],"superior":[55],"performance":[56],"also":[57],"extends":[58],"privacy":[59,147],"leakage":[60],"risks":[61,148],"contexts.":[64,151],"Previous":[65],"privacy-preserving":[66,114],"methods":[67],"based":[68],"on":[69],"adversarial":[70,136,172],"examples":[71,173],"were":[72,89],"primarily":[73],"optimized":[74],"for":[75,92],"monolingual":[76],"models,":[77],"limiting":[78],"effectiveness":[80],"in":[81,129,149,189],"settings.":[83],"Moreover,":[84],"as":[85],"these":[86],"perturbation":[87],"mechanisms":[88],"predominantly":[90],"tailored":[91],"English,":[93],"transferability":[95],"other":[97],"languages":[98,143],"remains":[99],"constrained.":[100],"To":[101],"address":[102],"this":[103],"vulnerability,":[104],"we":[105],"propose":[106],"the":[107,119,130],"Disentanglement-based":[108],"Universal":[109],"Adversarial":[110],"Perturbation":[111],"(DUAP),":[112],"method":[115,153],"designed":[116],"counteract":[118],"Whisper":[120,207],"model.":[121],"Unlike":[122],"optimization-based":[123],"approaches,":[124],"DUAP":[125,210],"embeds":[126],"language-specific":[127,168],"features":[128,169],"latent":[131],"space":[132],"generate":[134],"robust":[135],"perturbations,":[137,187],"providing":[138],"consistent":[139],"protection":[140],"multiple":[142],"effectively":[145],"mitigating":[146],"employs":[154],"two-stage":[156],"language":[157,183],"attack:":[158],"first,":[159],"Language":[161],"Feature":[162],"Disentanglement":[163],"model":[164,208],"disentangles":[165],"reconstructs":[167],"produce":[171],"(AEs);":[174],"second,":[175],"gradient-based":[176],"optimization":[177],"refines":[178],"AEs":[179],"disrupt":[181],"Whisper\u2019s":[182],"identification":[184],"module.":[185],"DUAP\u2019s":[186],"effective":[188],"physical":[190],"digital":[192],"settings,":[193],"achieve":[194],"SNRs":[195],"from":[196],"40":[197],"dB":[198,203],"(lightest)":[199],"above":[201,224],"17":[202],"(strongest).":[204],"Across":[205],"three":[206],"sizes,":[209],"yields":[211],"WERs":[212],"95%":[214],"(English),":[215],"85%":[216],"(other":[217],"languages),":[218],"87%":[220],"(physical":[221],"settings),":[222],"maintaining":[223],"96%":[225],"under":[226],"AAC":[227],"(64,":[228],"72":[229],"kbps)":[230,235],"MP3":[232],"(32,":[233],"96":[234],"compressions.":[236]},"counts_by_year":[],"updated_date":"2026-04-10T06:02:16.177343","created_date":"2026-03-08T00:00:00"}
