{"id":"https://openalex.org/W4399485371","doi":"https://doi.org/10.1109/taslp.2024.3407600","title":"Distinctive and Natural Speaker Anonymization via Singular Value Transformation-Assisted Matrix","display_name":"Distinctive and Natural Speaker Anonymization via Singular Value Transformation-Assisted Matrix","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4399485371","doi":"https://doi.org/10.1109/taslp.2024.3407600"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2024.3407600","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3407600","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015560758","display_name":"Jixun Yao","orcid":"https://orcid.org/0000-0002-5324-7360"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jixun Yao","raw_affiliation_strings":["Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0000-0002-5324-7360","affiliations":[{"raw_affiliation_string":"Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107808955","display_name":"Qing Wang","orcid":"https://orcid.org/0009-0008-5449-4815"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Wang","raw_affiliation_strings":["Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0009-0008-5449-4815","affiliations":[{"raw_affiliation_string":"Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101783173","display_name":"Pengcheng Guo","orcid":"https://orcid.org/0009-0001-2388-5935"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengcheng Guo","raw_affiliation_strings":["Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0009-0001-2388-5935","affiliations":[{"raw_affiliation_string":"Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081164682","display_name":"Ziqian Ning","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqian Ning","raw_affiliation_strings":["Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100668966","display_name":"Lei Xie","orcid":"https://orcid.org/0000-0001-8234-0823"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Xie","raw_affiliation_strings":["Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0000-0001-8234-0823","affiliations":[{"raw_affiliation_string":"Audio, Speech and Langauge Processing Group (ASLP@NPU), School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.0547,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.92268773,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"32","issue":null,"first_page":"2944","last_page":"2956"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9639999866485596,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9495000243186951,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.6614549160003662},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.5845797061920166},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.56292325258255},{"id":"https://openalex.org/keywords/singular-value","display_name":"Singular value","score":0.5494503378868103},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.5449293255805969},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4266301989555359},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3577958345413208},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1311747431755066},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.08531588315963745},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.08465337753295898},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.08346334099769592},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.07207304239273071}],"concepts":[{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.6614549160003662},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.5845797061920166},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.56292325258255},{"id":"https://openalex.org/C109282560","wikidata":"https://www.wikidata.org/wiki/Q4166054","display_name":"Singular value","level":3,"score":0.5494503378868103},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.5449293255805969},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4266301989555359},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3577958345413208},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1311747431755066},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.08531588315963745},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.08465337753295898},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.08346334099769592},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07207304239273071},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2024.3407600","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3407600","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W123034841","https://openalex.org/W1494198834","https://openalex.org/W1574447377","https://openalex.org/W2033178790","https://openalex.org/W2115098197","https://openalex.org/W2144005487","https://openalex.org/W2165806037","https://openalex.org/W2402146185","https://openalex.org/W2612348557","https://openalex.org/W2746498480","https://openalex.org/W2801581493","https://openalex.org/W2808631503","https://openalex.org/W2890964092","https://openalex.org/W2898564584","https://openalex.org/W2954217241","https://openalex.org/W2972359262","https://openalex.org/W2972848589","https://openalex.org/W2972908178","https://openalex.org/W3024768724","https://openalex.org/W3024869864","https://openalex.org/W3043999252","https://openalex.org/W3081871358","https://openalex.org/W3096424617","https://openalex.org/W3097777922","https://openalex.org/W3142516134","https://openalex.org/W3143465836","https://openalex.org/W3180600971","https://openalex.org/W3197008493","https://openalex.org/W3201497420","https://openalex.org/W3209059054","https://openalex.org/W3210530853","https://openalex.org/W3212077957","https://openalex.org/W3216758611","https://openalex.org/W4206231964","https://openalex.org/W4210970267","https://openalex.org/W4221114270","https://openalex.org/W4221152846","https://openalex.org/W4224916568","https://openalex.org/W4281250109","https://openalex.org/W4296069300","https://openalex.org/W4306867200","https://openalex.org/W4319862433","https://openalex.org/W4372260248","https://openalex.org/W4372267192","https://openalex.org/W4386557792","https://openalex.org/W6778823374","https://openalex.org/W6779459370","https://openalex.org/W6783867762","https://openalex.org/W6788095198","https://openalex.org/W6791179763","https://openalex.org/W6795807602","https://openalex.org/W6843253040","https://openalex.org/W6854199242","https://openalex.org/W6936113694"],"related_works":["https://openalex.org/W4283262748","https://openalex.org/W1997774067","https://openalex.org/W2353644209","https://openalex.org/W2593663830","https://openalex.org/W2348743188","https://openalex.org/W2902317490","https://openalex.org/W4387423451","https://openalex.org/W2502773048","https://openalex.org/W2025460258","https://openalex.org/W4287663927"],"abstract_inverted_index":{"Speaker":[0],"anonymization":[1,95],"is":[2,43,167,226],"an":[3,27,109,134],"effective":[4],"privacy":[5,72,245],"protection":[6],"solution":[7],"that":[8,97,225],"aims":[9],"to":[10,38,102,115,137],"conceal":[11,116],"speaker's":[12,160],"identity":[13,104,202,219],"while":[14,250],"preserving":[15],"the":[16,21,57,117,146,151,154,159,170,173,190,197,206,216,237],"naturalness":[17,253],"and":[18,70,81,86,105,132,142,178,211,229,254],"distinctiveness":[19,194],"of":[20,61,172,192,199,239],"original":[22,118],"speech.":[23],"Mainstream":[24],"approaches":[25],"use":[26],"utterance-level":[28],"vector":[29],"from":[30,54,127],"a":[31,92,99,128,139],"pre-trained":[32,129],"automatic":[33],"speaker":[34,40,66,94,103,119,125,193,218,244],"verification":[35],"(ASV)":[36],"model":[37,131],"represent":[39],"identity,":[41],"which":[42],"then":[44],"averaged":[45],"or":[46],"modified":[47],"for":[48,153],"anonymization.":[49],"However,":[50],"these":[51,79],"systems":[52],"suffer":[53],"deterioration":[55],"in":[56,65,242],"<italic":[58,67],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[59,68],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">naturalness</i>":[60],"anonymized":[62,88,110,217,223],"speech,":[63,89],"degradation":[64,191],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">distinctiveness</i>,":[69],"severe":[71],"leakage":[73],"against":[74],"powerful":[75],"attackers.":[76],"To":[77],"address":[78],"issues":[80],"especially":[82],"generate":[83,215],"more":[84],"natural":[85,228],"distinctive":[87],"we":[90,214],"propose":[91],"novel":[93],"approach":[96,122,241],"models":[98],"matrix":[100,114,141,148,166,177,210],"related":[101],"transforms":[106],"it":[107],"into":[108],"singular":[111,163,181,207],"value":[112,164,208],"transformation-assisted":[113,165,209],"identity.":[120,161],"Our":[121],"extracts":[123],"frame-level":[124],"vectors":[126],"ASV":[130],"employs":[133],"attention":[135],"mechanism":[136],"create":[138],"speaker-score":[140,147],"speaker-related":[143,156,212],"tokens.":[144],"Notably,":[145],"acts":[149],"as":[150],"weight":[152],"corresponding":[155],"token,":[157],"representing":[158],"The":[162],"generated":[168],"through":[169,182],"recomposition":[171],"decomposed":[174],"orthonormal":[175],"eigenvectors":[176],"non-linear":[179],"transformed":[180],"Singular":[183],"Value":[184],"Decomposition":[185],"(SVD).":[186],"This":[187],"process":[188],"prevents":[189],"caused":[195],"by":[196],"introduction":[198],"other":[200],"speakers'":[201],"information.":[203],"By":[204],"multiplying":[205],"tokens,":[213],"representation,":[220],"thereby":[221],"producing":[222],"speech":[224,252],"both":[227],"distinctive.":[230],"Experiments":[231],"on":[232],"VoicePrivacy":[233],"Challenge":[234],"datasets":[235],"demonstrate":[236],"effectiveness":[238],"our":[240],"protecting":[243],"under":[246],"all":[247],"attack":[248],"scenarios":[249],"maintaining":[251],"distinctiveness.":[255]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
