{"id":"https://openalex.org/W7162404241","doi":"https://doi.org/10.48550/arxiv.2605.25962","title":"Continual Speaker Identity Unlearning with Minimal Interference","display_name":"Continual Speaker Identity Unlearning with Minimal Interference","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162404241","doi":"https://doi.org/10.48550/arxiv.2605.25962"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.25962","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.25962","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137055512","display_name":"Jinju Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Jinju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001893505","display_name":"Yunsung Kang","orcid":"https://orcid.org/0000-0002-4074-3138"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kang, Yunsung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136994520","display_name":"Gyeong-Moon Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Gyeong-Moon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5063908850","display_name":"Jong Hwan Ko","orcid":"https://orcid.org/0000-0003-4434-4318"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ko, Jong Hwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.6182000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.6182000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08250000327825546,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.0215000007301569,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.7770000100135803},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6583999991416931},{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.5285999774932861},{"id":"https://openalex.org/keywords/interference","display_name":"Interference (communication)","score":0.49300000071525574},{"id":"https://openalex.org/keywords/linear-subspace","display_name":"Linear subspace","score":0.4832000136375427},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.32260000705718994}],"concepts":[{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.7770000100135803},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6583999991416931},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6236000061035156},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.5285999774932861},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.49300000071525574},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.4832000136375427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3752000033855438},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.35179999470710754},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3140999972820282},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.30090001225471497},{"id":"https://openalex.org/C2781162219","wikidata":"https://www.wikidata.org/wiki/Q26250693","display_name":"Replicate","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.26089999079704285},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2581999897956848},{"id":"https://openalex.org/C175694140","wikidata":"https://www.wikidata.org/wiki/Q980329","display_name":"Orthographic projection","level":2,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.25962","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.25962","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.6568925380706787}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Machine":[0],"unlearning":[1,19,43,65,79,98,128],"removes":[2],"designated":[3],"concepts":[4],"or":[5],"knowledge":[6],"from":[7],"pre-trained":[8],"models.":[9],"Recent":[10],"work":[11],"has":[12],"extended":[13],"this":[14,60],"paradigm":[15],"to":[16,32,82,105,117],"speaker":[17,68,96,107,136],"identity":[18,97],"in":[20,99],"zero-shot":[21],"text-to-speech":[22],"(ZS-TTS),":[23],"the":[24,75,91],"task":[25],"of":[26,151],"selectively":[27],"erasing":[28],"a":[29,34],"model's":[30],"ability":[31],"replicate":[33],"speaker's":[35],"voice.":[36],"Existing":[37],"methods,":[38],"however,":[39],"quietly":[40],"assume":[41],"all":[42],"requests":[44],"arrive":[45,54],"at":[46,158],"once;":[47],"an":[48],"unrealistic":[49],"assumption,":[50],"since":[51],"privacy-motivated":[52],"removals":[53],"sequentially":[55],"over":[56],"time.":[57],"We":[58,84],"show":[59],"assumption":[61],"breaks":[62],"state-of-the-art":[63],"methods:":[64],"each":[66,134],"new":[67],"fully":[69],"revives":[70],"previously":[71,139],"unlearned":[72,140],"speakers,":[73],"reintroducing":[74],"very":[76],"privacy":[77],"risk":[78],"was":[80],"meant":[81],"eliminate.":[83],"present":[85],"Cumulative":[86],"ORThogonal":[87],"Identity":[88],"Suppression":[89],"(CORTIS),":[90],"first":[92],"framework":[93],"for":[94],"continual":[95],"ZS-TTS":[100],"that":[101],"requires":[102],"no":[103],"access":[104],"previously-unlearned":[106],"data.":[108],"CORTIS":[109,132],"combines":[110],"Fisher-information-based":[111],"parameter":[112],"masking,":[113],"which":[114],"localizes":[115],"updates":[116],"speaker-relevant":[118],"weights,":[119],"with":[120],"orthogonal":[121],"projection":[122],"against":[123],"subspaces":[124],"spanned":[125],"by":[126],"prior":[127,152],"updates.":[129],"With":[130],"VoiceBox,":[131],"unlearns":[133],"requested":[135],"while":[137],"keeping":[138],"speakers":[141],"forgotten":[142],"across":[143],"long":[144],"request":[145],"sequences,":[146],"substantially":[147],"outperforming":[148],"sequential":[149],"application":[150],"methods.":[153],"The":[154],"demo":[155],"is":[156],"available":[157],"https://cumulativeortis.github.io/":[159],".":[160]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
