{"id":"https://openalex.org/W4406461995","doi":"https://doi.org/10.1109/slt61566.2024.10832292","title":"The Database and Benchmark For the Source Speaker Tracing Challenge 2024","display_name":"The Database and Benchmark For the Source Speaker Tracing Challenge 2024","publication_year":2024,"publication_date":"2024-12-02","ids":{"openalex":"https://openalex.org/W4406461995","doi":"https://doi.org/10.1109/slt61566.2024.10832292"},"language":"en","primary_location":{"id":"doi:10.1109/slt61566.2024.10832292","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832292","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100424650","display_name":"Ze Li","orcid":"https://orcid.org/0000-0003-1522-6187"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ze Li","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049403564","display_name":"Yuke Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuke Lin","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100387925","display_name":"Yao Tian","orcid":"https://orcid.org/0009-0002-3530-3944"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian Yao","raw_affiliation_strings":["OPPO,AI Center,Beijing,China"],"affiliations":[{"raw_affiliation_string":"OPPO,AI Center,Beijing,China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109630497","display_name":"Hongbin Suo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongbin Suo","raw_affiliation_strings":["OPPO,AI Center,Beijing,China"],"affiliations":[{"raw_affiliation_string":"OPPO,AI Center,Beijing,China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036446253","display_name":"Pengyuan Zhang","orcid":"https://orcid.org/0000-0001-6838-5160"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengyuan Zhang","raw_affiliation_strings":["Institute of Acoustics, CAS,Key Laboratory of Speech Acoustics and Content Understanding,China"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics, CAS,Key Laboratory of Speech Acoustics and Content Understanding,China","institution_ids":["https://openalex.org/I4210099069"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101499462","display_name":"Yanzhen Ren","orcid":"https://orcid.org/0000-0003-0799-5082"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanzhen Ren","raw_affiliation_strings":["Wuhan University,Key Laboratory of Aerospace Information Security and Trusted Computing, Ministry of Education, School of Cyber Science and Engineering"],"affiliations":[{"raw_affiliation_string":"Wuhan University,Key Laboratory of Aerospace Information Security and Trusted Computing, Ministry of Education, School of Cyber Science and Engineering","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076833848","display_name":"Zexin Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zexin Cai","raw_affiliation_strings":["Johns Hopkins University,Center for Language and Speech Processing,USA"],"affiliations":[{"raw_affiliation_string":"Johns Hopkins University,Center for Language and Speech Processing,USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014342555","display_name":"Hiromitsu Nishizaki","orcid":"https://orcid.org/0000-0002-7717-8312"},"institutions":[{"id":"https://openalex.org/I44892455","display_name":"Takeda (Japan)","ror":"https://ror.org/04hjbmv12","country_code":"JP","type":"company","lineage":["https://openalex.org/I44892455"]},{"id":"https://openalex.org/I66906201","display_name":"University of Yamanashi","ror":"https://ror.org/059x21724","country_code":"JP","type":"education","lineage":["https://openalex.org/I66906201"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiromitsu Nishizaki","raw_affiliation_strings":["University of Yamanashi, 4-4-37, Takeda, Kofu,Integrated Graduate School of Medicine, Engineering, and Agricultural Sciences,Yamanashi,Japan,400-8510"],"affiliations":[{"raw_affiliation_string":"University of Yamanashi, 4-4-37, Takeda, Kofu,Integrated Graduate School of Medicine, Engineering, and Agricultural Sciences,Yamanashi,Japan,400-8510","institution_ids":["https://openalex.org/I66906201","https://openalex.org/I44892455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100351375","display_name":"Ming Li","orcid":"https://orcid.org/0000-0002-0722-028X"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Li","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5100424650"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.6891,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.77773521,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1254","last_page":"1261"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9749000072479248,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7769056558609009},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7639521956443787},{"id":"https://openalex.org/keywords/tracing","display_name":"Tracing","score":0.6702253818511963},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5783995389938354},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3342784643173218},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.22988569736480713},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.058709800243377686}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7769056558609009},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7639521956443787},{"id":"https://openalex.org/C138673069","wikidata":"https://www.wikidata.org/wiki/Q322229","display_name":"Tracing","level":2,"score":0.6702253818511963},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5783995389938354},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3342784643173218},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.22988569736480713},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.058709800243377686},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/slt61566.2024.10832292","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832292","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2123299109","https://openalex.org/W2168254078","https://openalex.org/W2176804518","https://openalex.org/W2194775991","https://openalex.org/W2219249508","https://openalex.org/W2248269543","https://openalex.org/W2696967604","https://openalex.org/W2726515241","https://openalex.org/W2745896134","https://openalex.org/W2808631503","https://openalex.org/W2890964092","https://openalex.org/W2936802426","https://openalex.org/W2967606780","https://openalex.org/W3010893827","https://openalex.org/W3024869864","https://openalex.org/W3083423753","https://openalex.org/W3101498587","https://openalex.org/W3163475957","https://openalex.org/W3165478005","https://openalex.org/W3197358873","https://openalex.org/W3197659778","https://openalex.org/W3197763626","https://openalex.org/W3202267900","https://openalex.org/W3209984917","https://openalex.org/W3213785244","https://openalex.org/W4221138880","https://openalex.org/W4221154745","https://openalex.org/W4320451749","https://openalex.org/W4372260053","https://openalex.org/W4372260476","https://openalex.org/W4375868976","https://openalex.org/W4378506723","https://openalex.org/W4385823240","https://openalex.org/W4385823264","https://openalex.org/W4385823375","https://openalex.org/W4385823432","https://openalex.org/W4385823472","https://openalex.org/W4392969497","https://openalex.org/W4400033122","https://openalex.org/W6688816777","https://openalex.org/W6746052068","https://openalex.org/W6782990278","https://openalex.org/W6802029025","https://openalex.org/W6802527329","https://openalex.org/W6805710207","https://openalex.org/W6843707108","https://openalex.org/W6849600165","https://openalex.org/W6852755086","https://openalex.org/W6856419980"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W4246352526"],"abstract_inverted_index":{"Voice":[0],"conversion":[1,97],"(VC)":[2],"systems":[3,83,135],"can":[4,143],"transform":[5],"audio":[6],"to":[7,49,111],"mimic":[8],"another":[9],"speaker\u2019s":[10],"voice,":[11],"thereby":[12],"attacking":[13],"speaker":[14,23],"verification":[15,24],"(SV)":[16],"systems.":[17],"However,":[18],"ongoing":[19],"studies":[20],"on":[21,44,85],"source":[22],"(SSV)":[25],"are":[26],"hindered":[27],"by":[28],"limited":[29],"data":[30],"availability":[31],"and":[32,56,77,123,130],"methodological":[33],"constraints.":[34],"This":[35],"paper":[36],"presents":[37],"the":[38,51,54,59,86,101,105,117,120,128],"Source":[39],"Speaker":[40],"Tracking":[41],"Challenge":[42],"(SSTC)":[43],"STL":[45],"2024,":[46],"which":[47],"aims":[48],"fill":[50],"gap":[52],"in":[53],"database":[55,71],"benchmark":[57],"for":[58,115],"SSV":[60,106,121],"task.":[61,107],"In":[62,89],"this":[63],"study,":[64],"we":[65,91],"generate":[66],"a":[67,79,93,113],"large-scale":[68],"converted":[69],"speech":[70],"with":[72,100],"16":[73],"common":[74],"VC":[75,137],"methods":[76],"train":[78],"batch":[80],"of":[81,103,119,132],"baseline":[82],"based":[84],"MFA-Conformer":[87],"architecture.":[88],"addition,":[90],"introduced":[92],"related":[94],"task":[95,122],"called":[96],"method":[98],"recognition,":[99],"aim":[102],"assisting":[104],"We":[108],"expect":[109],"SSTC":[110,142],"be":[112,144],"platform":[114],"advancing":[116],"development":[118],"provide":[124],"further":[125],"insights":[126],"into":[127],"performance":[129],"limitations":[131],"current":[133],"SV":[134],"against":[136],"attacks.":[138],"Further":[139],"details":[140],"about":[141],"found":[145],"here<sup":[146],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[147,149],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>.<sup":[148],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>https://sstc-challenge.github.io/":[150]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
