{"id":"https://openalex.org/W2944613371","doi":"https://doi.org/10.1109/iscslp.2018.8706575","title":"Generative Adversarial Networks based X-vector Augmentation for Robust Probabilistic Linear Discriminant Analysis in Speaker Verification","display_name":"Generative Adversarial Networks based X-vector Augmentation for Robust Probabilistic Linear Discriminant Analysis in Speaker Verification","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2944613371","doi":"https://doi.org/10.1109/iscslp.2018.8706575","mag":"2944613371"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2018.8706575","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2018.8706575","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057050425","display_name":"Yexin Yang","orcid":"https://orcid.org/0000-0001-9597-9829"},"institutions":[{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"funder","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yexin Yang","raw_affiliation_strings":["Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055716987","display_name":"Shuai Wang","orcid":"https://orcid.org/0000-0002-1796-7280"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"funder","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Wang","raw_affiliation_strings":["Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103897732","display_name":"Man Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"funder","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Man Sun","raw_affiliation_strings":["Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100341993","display_name":"Yanmin Qian","orcid":"https://orcid.org/0000-0002-0314-3790"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"funder","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanmin Qian","raw_affiliation_strings":["Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043098653","display_name":"Kai Yu","orcid":"https://orcid.org/0000-0002-7102-9826"},"institutions":[{"id":"https://openalex.org/I4210165726","display_name":"Shanghai Municipal Education Commission","ror":"https://ror.org/05tewj457","country_code":"CN","type":"funder","lineage":["https://openalex.org/I4210165456","https://openalex.org/I4210165726"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Yu","raw_affiliation_strings":["Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Key Lab. of Shanghai Education Commission for Intelligent Interaction and Cognitive Engineering SpeechLab, Brain Science and Technology Research Center Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210165726","https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5057050425"],"corresponding_institution_ids":["https://openalex.org/I183067930","https://openalex.org/I4210165726"],"apc_list":null,"apc_paid":null,"fwci":1.466,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.8707721,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"205","last_page":"209"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7274941802024841},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7186291217803955},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.6955058574676514},{"id":"https://openalex.org/keywords/linear-discriminant-analysis","display_name":"Linear discriminant analysis","score":0.6193381547927856},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6052477359771729},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5508298873901367},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5504502058029175},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.5296280980110168},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4810098111629486},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4651993215084076},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.42924922704696655},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.35399875044822693},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18858987092971802}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7274941802024841},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7186291217803955},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.6955058574676514},{"id":"https://openalex.org/C69738355","wikidata":"https://www.wikidata.org/wiki/Q1228929","display_name":"Linear discriminant analysis","level":2,"score":0.6193381547927856},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6052477359771729},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5508298873901367},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5504502058029175},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.5296280980110168},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4810098111629486},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4651993215084076},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.42924922704696655},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.35399875044822693},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18858987092971802},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp.2018.8706575","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2018.8706575","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7400000095367432}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W577640895","https://openalex.org/W1006777433","https://openalex.org/W1524333225","https://openalex.org/W1589137271","https://openalex.org/W1999033484","https://openalex.org/W2046056978","https://openalex.org/W2059610484","https://openalex.org/W2099471712","https://openalex.org/W2121812409","https://openalex.org/W2125389028","https://openalex.org/W2147147599","https://openalex.org/W2150769028","https://openalex.org/W2154278880","https://openalex.org/W2160306971","https://openalex.org/W2160815625","https://openalex.org/W2163605009","https://openalex.org/W2173520492","https://openalex.org/W2293078015","https://openalex.org/W2294814385","https://openalex.org/W2360384684","https://openalex.org/W2404617565","https://openalex.org/W2405756170","https://openalex.org/W2406312423","https://openalex.org/W2488005896","https://openalex.org/W2666408839","https://openalex.org/W2696967604","https://openalex.org/W2738829388","https://openalex.org/W2739748921","https://openalex.org/W2748318213","https://openalex.org/W2748488820","https://openalex.org/W2770173563","https://openalex.org/W2888930363","https://openalex.org/W2888968865","https://openalex.org/W2890654588","https://openalex.org/W2890964092","https://openalex.org/W2891138528","https://openalex.org/W2949999304","https://openalex.org/W2962879692","https://openalex.org/W2963341071","https://openalex.org/W2963684088","https://openalex.org/W3099832538","https://openalex.org/W4295521014","https://openalex.org/W4320013936","https://openalex.org/W6631362777","https://openalex.org/W6635152626","https://openalex.org/W6678815747","https://openalex.org/W6684191040","https://openalex.org/W6685352114","https://openalex.org/W6713645886","https://openalex.org/W6713727690","https://openalex.org/W6735429107","https://openalex.org/W6735913928","https://openalex.org/W6741832134","https://openalex.org/W6746638498"],"related_works":["https://openalex.org/W2118039276","https://openalex.org/W2051274299","https://openalex.org/W468945283","https://openalex.org/W4235705411","https://openalex.org/W1521299571","https://openalex.org/W204267554","https://openalex.org/W2147062549","https://openalex.org/W2134501921","https://openalex.org/W4252590334","https://openalex.org/W2543777506"],"abstract_inverted_index":{"Data":[0],"augmentation":[1,33],"is":[2,42,64],"an":[3],"effective":[4],"method":[5],"to":[6,66,83],"increase":[7],"the":[8,15,75,87],"quantity":[9],"of":[10,54,108],"training":[11],"data,":[12],"which":[13,41],"improves":[14],"model's":[16],"robustness":[17],"and":[18,94,110,116],"generalization":[19],"ability.":[20],"In":[21],"this":[22,95],"paper,":[23],"we":[24],"propose":[25],"a":[26,43,60],"generative":[27],"adversarial":[28],"network":[29],"(GAN)":[30],"based":[31,49],"data":[32],"approach":[34],"for":[35,46,114],"probabilistic":[36],"linear":[37],"discriminant":[38],"analysis":[39],"(PLDA),":[40],"standard":[44,76],"back-end":[45],"state-of-the-art":[47],"x-vector":[48],"speaker":[50],"verification":[51],"system.":[52],"Instead":[53],"generating":[55],"new":[56],"spectral":[57],"feature":[58],"samples,":[59],"conditional":[61],"Wasserstein":[62],"GAN":[63,88],"adopted":[65],"directly":[67],"generate":[68],"x-vectors.":[69],"Experiments":[70],"are":[71],"carried":[72],"out":[73],"on":[74],"NIST":[77],"SRE":[78],"2016":[79],"evaluation":[80,118],"dataset.":[81],"Compared":[82],"manually":[84],"adding":[85],"noise,":[86],"augmented":[89,105],"PLDA":[90],"achieves":[91],"better":[92],"performance":[93,96],"can":[97],"be":[98],"further":[99],"boosted":[100],"when":[101],"combined":[102],"with":[103],"manual":[104],"data.":[106],"EER":[107],"11.68%":[109],"4.43%":[111],"were":[112],"obtained":[113],"Tagalog":[115],"Cantonese":[117],"condition,":[119],"respectively.":[120]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
