{"id":"https://openalex.org/W2963127219","doi":"https://doi.org/10.21437/odyssey.2018-27","title":"A Spoofing Benchmark for the 2018 Voice Conversion Challenge: Leveraging from Spoofing Countermeasures for Speech Artifact Assessment","display_name":"A Spoofing Benchmark for the 2018 Voice Conversion Challenge: Leveraging from Spoofing Countermeasures for Speech Artifact Assessment","publication_year":2018,"publication_date":"2018-06-06","ids":{"openalex":"https://openalex.org/W2963127219","doi":"https://doi.org/10.21437/odyssey.2018-27","mag":"2963127219"},"language":"en","primary_location":{"id":"doi:10.21437/odyssey.2018-27","is_oa":false,"landing_page_url":"https://doi.org/10.21437/odyssey.2018-27","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2018)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.research.ed.ac.uk/en/publications/992a42bf-5fac-444d-b5ac-19098cd93558","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043168931","display_name":"Tomi Kinnunen","orcid":"https://orcid.org/0000-0002-4371-7322"},"institutions":[{"id":"https://openalex.org/I175532246","display_name":"University of Eastern Finland","ror":"https://ror.org/00cyydd11","country_code":"FI","type":"education","lineage":["https://openalex.org/I175532246"]}],"countries":["FI"],"is_corresponding":true,"raw_author_name":"Tomi Kinnunen","raw_affiliation_strings":["University of Eastern Finland, Joensuu, Finland"],"affiliations":[{"raw_affiliation_string":"University of Eastern Finland, Joensuu, Finland","institution_ids":["https://openalex.org/I175532246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019530089","display_name":"Jaime Lorenzo-Trueba","orcid":"https://orcid.org/0000-0003-0459-1429"},"institutions":[{"id":"https://openalex.org/I184597095","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47","country_code":"JP","type":"facility","lineage":["https://openalex.org/I1319490839","https://openalex.org/I184597095","https://openalex.org/I4210158934"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jaime Lorenzo-Trueba","raw_affiliation_strings":["National Institute of Informatics, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"National Institute of Informatics, Tokyo, Japan","institution_ids":["https://openalex.org/I184597095"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007639385","display_name":"Junichi Yamagishi","orcid":"https://orcid.org/0000-0003-2752-3955"},"institutions":[{"id":"https://openalex.org/I184597095","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47","country_code":"JP","type":"facility","lineage":["https://openalex.org/I1319490839","https://openalex.org/I184597095","https://openalex.org/I4210158934"]},{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB","JP"],"is_corresponding":false,"raw_author_name":"Junichi Yamagishi","raw_affiliation_strings":["University of Edinburgh, UK","National Institute of Informatics, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"National Institute of Informatics, Tokyo, Japan","institution_ids":["https://openalex.org/I184597095"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078330211","display_name":"Tomoki Toda","orcid":"https://orcid.org/0000-0001-8146-1279"},"institutions":[{"id":"https://openalex.org/I60134161","display_name":"Nagoya University","ror":"https://ror.org/04chrp450","country_code":"JP","type":"education","lineage":["https://openalex.org/I60134161"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomoki Toda","raw_affiliation_strings":["Nagoya University, Nagoya, Japan"],"affiliations":[{"raw_affiliation_string":"Nagoya University, Nagoya, Japan","institution_ids":["https://openalex.org/I60134161"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010841595","display_name":"Daisuke Saito","orcid":"https://orcid.org/0000-0003-3200-579X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Daisuke Saito","raw_affiliation_strings":["University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020219878","display_name":"Fernando Villavicencio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fernando Villavicencio","raw_affiliation_strings":["ObEN, Pasadena, USA"],"affiliations":[{"raw_affiliation_string":"ObEN, Pasadena, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059767940","display_name":"Zhen-Hua Ling","orcid":"https://orcid.org/0000-0001-7853-5273"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenhua Ling","raw_affiliation_strings":["University of Science and Technology of China, Heifei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Heifei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5043168931"],"corresponding_institution_ids":["https://openalex.org/I175532246"],"apc_list":null,"apc_paid":null,"fwci":2.8768,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.92974912,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"187","last_page":"194"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9767000079154968,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spoofing-attack","display_name":"Spoofing attack","score":0.925148606300354},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7480294108390808},{"id":"https://openalex.org/keywords/artifact","display_name":"Artifact (error)","score":0.7387393712997437},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6702390909194946},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5547211170196533},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.2988279461860657},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28892791271209717}],"concepts":[{"id":"https://openalex.org/C167900197","wikidata":"https://www.wikidata.org/wiki/Q11081100","display_name":"Spoofing attack","level":2,"score":0.925148606300354},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7480294108390808},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.7387393712997437},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6702390909194946},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5547211170196533},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2988279461860657},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28892791271209717},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/odyssey.2018-27","is_oa":false,"landing_page_url":"https://doi.org/10.21437/odyssey.2018-27","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2018)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:openaire/992a42bf-5fac-444d-b5ac-19098cd93558","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/992a42bf-5fac-444d-b5ac-19098cd93558","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Kinnunen, T, Lorenzo-Trueba, J, Yamagishi, J, Toda, T, Saito, D, Villavicencio, F & Ling, Z 2018, A Spoofing Benchmark for the 2018 Voice Conversion Challenge: Leveraging from Spoofing Countermeasures for Speech Artifact Assessment. in Speaker Odyssey 2018 : The Speaker and Language Recognition Workshop. Les Sables d'Olonne, France, pp. 187-194, The Speaker and Language Recognition Workshop, Les Sables d\u2019Olonne, France, 26/06/18. https://doi.org/10.21437/Odyssey.2018-27","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:pure.ed.ac.uk:openaire/992a42bf-5fac-444d-b5ac-19098cd93558","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/992a42bf-5fac-444d-b5ac-19098cd93558","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Kinnunen, T, Lorenzo-Trueba, J, Yamagishi, J, Toda, T, Saito, D, Villavicencio, F & Ling, Z 2018, A Spoofing Benchmark for the 2018 Voice Conversion Challenge: Leveraging from Spoofing Countermeasures for Speech Artifact Assessment. in Speaker Odyssey 2018 : The Speaker and Language Recognition Workshop. Les Sables d'Olonne, France, pp. 187-194, The Speaker and Language Recognition Workshop, Les Sables d\u2019Olonne, France, 26/06/18. https://doi.org/10.21437/Odyssey.2018-27","raw_type":"contributionToPeriodical"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2047346462","https://openalex.org/W2086381917","https://openalex.org/W2100649345","https://openalex.org/W2101587318","https://openalex.org/W2120605154","https://openalex.org/W2123299109","https://openalex.org/W2128466129","https://openalex.org/W2133420453","https://openalex.org/W2295634712","https://openalex.org/W2297648422","https://openalex.org/W2303197844","https://openalex.org/W2407170210","https://openalex.org/W2473388484","https://openalex.org/W2519091744","https://openalex.org/W2564082391","https://openalex.org/W2565961899","https://openalex.org/W2576309025","https://openalex.org/W2588445447","https://openalex.org/W2604812030","https://openalex.org/W2739735615","https://openalex.org/W2746474733","https://openalex.org/W2747024632","https://openalex.org/W2756766252","https://openalex.org/W2963035245"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2998478967","https://openalex.org/W2188559950","https://openalex.org/W2989910292","https://openalex.org/W3128793638","https://openalex.org/W2123299109","https://openalex.org/W2021230337","https://openalex.org/W2895823926","https://openalex.org/W2972676112"],"abstract_inverted_index":{"Voice":[0,126],"conversion":[1,5],"(VC)":[2],"aims":[3],"at":[4],"of":[6,34,60,143,150,156,170,190,212,215],"speaker":[7,26,40,83],"characteristic":[8],"without":[9,28],"altering":[10],"content.":[11],"Due":[12],"to":[13,23,113,120,139,226],"training":[14],"data":[15],"limitations":[16],"and":[17,42,53,182,223],"modeling":[18],"imperfections,":[19],"it":[20,56],"is":[21,195],"difficult":[22],"achieve":[24],"believable":[25],"mimicry":[27],"introducing":[29],"processing":[30,144],"artifacts;":[31],"performance":[32],"assessment":[33,67,107],"VC,":[35],"therefore,":[36],"usually":[37],"involves":[38],"both":[39],"similarity":[41],"quality":[43,184],"evaluation":[44],"by":[45],"a":[46,50,118,133,153,220],"human":[47,161],"panel.":[48],"As":[49,117],"time-consuming,":[51],"expensive,":[52],"non-reproducible":[54],"process,":[55],"hinders":[57],"rapid":[58],"prototyping":[59],"new":[61],"VC":[62,157,228],"technology.":[63,229],"We":[64],"address":[65],"artifact":[66,106,166],"using":[68],"an":[69],"alternative,":[70],"objective":[71],"approach":[72],"leveraging":[73],"from":[74],"prior":[75],"work":[76],"on":[77],"spoofing":[78],"countermeasures":[79],"(CMs)":[80],"for":[81,89,103,123],"automatic":[82,104],"verification.":[84],"Therein,":[85],"CMs":[86,213],"are":[87,173],"used":[88],"rejecting":[90],"\u2018fake\u2019":[91],"inputs":[92],"such":[93],"as":[94,164,219],"replayed,":[95],"synthetic":[96],"or":[97],"converted":[98],"speech":[99,105],"but":[100],"their":[101,216],"potential":[102,211],"remains":[108],"unknown.":[109],"This":[110],"study":[111],"serves":[112,163],"fill":[114],"that":[115],"gap.":[116],"supplement":[119],"subjective":[121],"results":[122],"the":[124,141,151,191],"2018":[125],"Conversion":[127],"Challenge":[128],"(VCC\u201918)":[129],"data,":[130],"we":[131],"configure":[132],"standard":[134],"constant-Q":[135],"cepstral":[136],"coefficient":[137],"CM":[138],"quantify":[140],"extent":[142],"artifacts.":[145,188],"Equal":[146],"error":[147],"rate":[148],"(EER)":[149],"CM,":[152],"confusability":[154],"index":[155],"samples":[158],"with":[159,177,186],"real":[160],"speech,":[162],"our":[165],"measure.":[167],"Two":[168],"clusters":[169],"VCC\u201918":[171,192],"entries":[172],"identified:":[174],"low-quality":[175],"ones":[176,185],"detectable":[178],"artifacts":[179],"(low":[180],"EERs),":[181],"higher":[183],"less":[187],"None":[189],"systems,":[193],"however,":[194],"perfect:":[196],"all":[197],"EERs":[198],"are&lt;":[199],"30%":[200],"(the":[201],"\u2018ideal\u2019":[202],"value":[203],"would":[204],"be":[205],"50%).":[206],"Our":[207],"preliminary":[208],"findings":[209],"suggest":[210],"outside":[214],"original":[217],"application,":[218],"supplemental":[221],"optimization":[222],"benchmarking":[224],"tool":[225],"enhance":[227]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":4}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
