{"id":"https://openalex.org/W3048782751","doi":"https://doi.org/10.21437/interspeech.2020-2699","title":"Neural PLDA Modeling for End-to-End Speaker Verification","display_name":"Neural PLDA Modeling for End-to-End Speaker Verification","publication_year":2020,"publication_date":"2020-10-25","ids":{"openalex":"https://openalex.org/W3048782751","doi":"https://doi.org/10.21437/interspeech.2020-2699","mag":"3048782751"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2020-2699","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-2699","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2020","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2008.04527","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113091984","display_name":"Shreyas Ramoji","orcid":null},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Shreyas Ramoji","raw_affiliation_strings":["Indian Institute of Science Bangalore, Bengaluru, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Indian Institute of Science Bangalore, Bengaluru, India","institution_ids":["https://openalex.org/I59270414"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113921893","display_name":"Prashant Krishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Prashant Krishnan","raw_affiliation_strings":["Indian Institute of Science Bangalore, Bengaluru, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Indian Institute of Science Bangalore, Bengaluru, India","institution_ids":["https://openalex.org/I59270414"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002536077","display_name":"Sriram Ganapathy","orcid":"https://orcid.org/0000-0002-5779-9066"},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sriram Ganapathy","raw_affiliation_strings":["Indian Institute of Science"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Indian Institute of Science","institution_ids":["https://openalex.org/I59270414"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I59270414"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.09282481,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4333","last_page":"4337"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.8169683218002319},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7996293902397156},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7885346412658691},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.7156584858894348},{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.63114994764328},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5533466339111328},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5225781202316284},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5131052732467651},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4911479651927948},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.471201628446579},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4680333435535431},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.42990565299987793}],"concepts":[{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.8169683218002319},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7996293902397156},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7885346412658691},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.7156584858894348},{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.63114994764328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5533466339111328},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5225781202316284},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5131052732467651},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4911479651927948},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.471201628446579},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4680333435535431},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.42990565299987793},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.21437/interspeech.2020-2699","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-2699","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2020","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.iisc.ac.in:67634","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401429","display_name":"ePrints@IISc (Indian Institute of Science)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I59270414","host_organization_name":"Indian Institute of Science Bangalore","host_organization_lineage":["https://openalex.org/I59270414"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"},{"id":"pmh:oai:arXiv.org:2008.04527","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.04527","pdf_url":"https://arxiv.org/pdf/2008.04527","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:3048782751","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/2008.04527.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2008.04527","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2008.04527","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2008.04527","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.04527","pdf_url":"https://arxiv.org/pdf/2008.04527","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7200000286102295,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3048782751.pdf","grobid_xml":"https://content.openalex.org/works/W3048782751.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W1481604723","https://openalex.org/W1836183712","https://openalex.org/W1971758513","https://openalex.org/W1990942610","https://openalex.org/W2123768812","https://openalex.org/W2147147599","https://openalex.org/W2150769028","https://openalex.org/W2395750323","https://openalex.org/W2406312423","https://openalex.org/W2587150483","https://openalex.org/W2726515241","https://openalex.org/W2747238065","https://openalex.org/W2766245080","https://openalex.org/W2890964092","https://openalex.org/W2938358845","https://openalex.org/W2962788625","https://openalex.org/W2972327892","https://openalex.org/W2972606715","https://openalex.org/W2978904488","https://openalex.org/W2979593053","https://openalex.org/W3001061282","https://openalex.org/W3004892871","https://openalex.org/W3104056985"],"related_works":["https://openalex.org/W3097605294","https://openalex.org/W3104056985","https://openalex.org/W3001061282","https://openalex.org/W2053159670","https://openalex.org/W1968709559","https://openalex.org/W2053415153","https://openalex.org/W2394709239","https://openalex.org/W121563923","https://openalex.org/W2117881710","https://openalex.org/W2888742381","https://openalex.org/W2123768812","https://openalex.org/W2887833611","https://openalex.org/W3015596621","https://openalex.org/W284864749","https://openalex.org/W2011229062","https://openalex.org/W2070852568","https://openalex.org/W3156175260","https://openalex.org/W3172577958","https://openalex.org/W2999952536","https://openalex.org/W2586956420"],"abstract_inverted_index":{"While":[0],"deep":[1],"learning":[2],"models":[3,16],"have":[4],"made":[5],"significant":[6],"advances":[7],"in":[8,66,127],"supervised":[9],"classification":[10],"problems,":[11],"the":[12,52,70,75,80,92,96,117,124,140,151,155,163,176,183],"application":[13],"of":[14,79,95,116],"these":[15],"for":[17,50,63],"out-of-set":[18],"verification":[19,37,53,68,103,145,188],"tasks":[20],"like":[21],"speaker":[22,36,67,165,187],"recognition":[23,166],"has":[24],"been":[25],"limited":[26],"to":[27,112],"deriving":[28],"feature":[29],"embeddings.":[30],"The":[31],"state-of-the-art":[32],"x-vector":[33,184],"PLDA":[34,72,82,185],"based":[35,43],"systems":[38],"use":[39],"a":[40,59,87,102,144],"generative":[41,81],"model":[42,83,135,152,179],"on":[44],"probabilistic":[45],"linear":[46],"discriminant":[47],"analysis":[48],"(PLDA)":[49],"computing":[51],"score.":[54,158],"Recently,":[55],"we":[56,108,173],"had":[57],"proposed":[58,133,177],"neural":[60,71,119],"network":[61,120,126],"approach":[62],"backend":[64],"modeling":[65],"called":[69],"(NPLDA)":[73],"where":[74],"likelihood":[76,156],"ratio":[77,157],"score":[78,97],"is":[84,136],"posed":[85],"as":[86],"discriminative":[88],"similarity":[89],"function":[90,98,147],"and":[91,148,170],"learnable":[93],"parameters":[94],"are":[99],"optimized":[100,137],"using":[101,162],"cost.":[104],"In":[105],"this":[106,110],"paper,":[107],"extend":[109],"work":[111],"achieve":[113],"joint":[114],"optimization":[115],"embedding":[118],"(x-vector":[121],"network)":[122],"with":[123,143],"NPLDA":[125],"an":[128],"end-to-end":[129,134],"(E2E)":[130],"fashion.":[131],"This":[132],"directly":[138,153],"from":[139],"acoustic":[141],"features":[142],"cost":[146],"during":[149],"testing,":[150],"outputs":[154],"With":[159],"various":[160],"experiments":[161],"NIST":[164],"evaluation":[167],"(SRE)":[168],"2018":[169],"2019":[171],"datasets,":[172],"show":[174],"that":[175],"E2E":[178],"improves":[180],"significantly":[181],"over":[182],"baseline":[186],"system.":[189]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
