{"id":"https://openalex.org/W4312326706","doi":"https://doi.org/10.1109/dasc/picom/cbdcom/cy55231.2022.9927875","title":"Speaker Recognition using Multiple X-Vector Speaker Representations with Two-Stage Clustering and Outlier Detection Refinement","display_name":"Speaker Recognition using Multiple X-Vector Speaker Representations with Two-Stage Clustering and Outlier Detection Refinement","publication_year":2022,"publication_date":"2022-09-12","ids":{"openalex":"https://openalex.org/W4312326706","doi":"https://doi.org/10.1109/dasc/picom/cbdcom/cy55231.2022.9927875"},"language":"en","primary_location":{"id":"doi:10.1109/dasc/picom/cbdcom/cy55231.2022.9927875","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasc/picom/cbdcom/cy55231.2022.9927875","pdf_url":null,"source":{"id":"https://openalex.org/S4363605495","display_name":"2022 IEEE Intl Conf on Dependable, Autonomic and Secure Computing, Intl Conf on Pervasive Intelligence and Computing, Intl Conf on Cloud and Big Data Computing, Intl Conf on Cyber Science and Technology Congress (DASC/PiCom/CBDCom/CyberSciTech)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Intl Conf on Dependable, Autonomic and Secure Computing, Intl Conf on Pervasive Intelligence and Computing, Intl Conf on Cloud and Big Data Computing, Intl Conf on Cyber Science and Technology Congress (DASC/PiCom/CBDCom/CyberSciTech)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021596654","display_name":"Roman Shrestha","orcid":"https://orcid.org/0000-0002-7420-1329"},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Roman Shrestha","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044554092","display_name":"Cornelius Glackin","orcid":"https://orcid.org/0000-0001-5114-6403"},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Cornelius Glackin","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063632288","display_name":"Julie Wall","orcid":"https://orcid.org/0000-0001-6714-4867"},"institutions":[{"id":"https://openalex.org/I157227730","display_name":"University of East London","ror":"https://ror.org/057jrqr44","country_code":"GB","type":"education","lineage":["https://openalex.org/I157227730"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Julie Wall","raw_affiliation_strings":["University of East London,London,UK","University of East London, London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of East London,London,UK","institution_ids":["https://openalex.org/I157227730"]},{"raw_affiliation_string":"University of East London, London, UK","institution_ids":["https://openalex.org/I157227730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012466886","display_name":"Nigel Cannings","orcid":"https://orcid.org/0000-0002-5279-3968"},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nigel Cannings","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030887779","display_name":"Marvin Rajwadi","orcid":"https://orcid.org/0000-0002-5411-0489"},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Marvin Rajwadi","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063811922","display_name":"Satya Kada","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Satya Kada","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021610847","display_name":"James Laird","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"James Laird","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065852886","display_name":"Thea Laird","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Thea Laird","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037676522","display_name":"Chris Woodruff","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chris Woodruff","raw_affiliation_strings":["Intelligent Voice Ltd.,London,UK","Intelligent Voice Ltd., London, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Voice Ltd.,London,UK","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Intelligent Voice Ltd., London, UK","institution_ids":["https://openalex.org/I4210153682"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5021596654"],"corresponding_institution_ids":["https://openalex.org/I4210153682"],"apc_list":null,"apc_paid":null,"fwci":0.1043,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.32337043,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7303752899169922},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7014800310134888},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6413155198097229},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.588676929473877},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.5786188840866089},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5628840923309326},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.5425137281417847},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5187528133392334},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.5165823698043823},{"id":"https://openalex.org/keywords/speaker-identification","display_name":"Speaker identification","score":0.5103492140769958},{"id":"https://openalex.org/keywords/stage","display_name":"Stage (stratigraphy)","score":0.4832633137702942},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4360736608505249},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.051979243755340576}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7303752899169922},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7014800310134888},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6413155198097229},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.588676929473877},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.5786188840866089},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5628840923309326},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.5425137281417847},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5187528133392334},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.5165823698043823},{"id":"https://openalex.org/C2986627078","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker identification","level":3,"score":0.5103492140769958},{"id":"https://openalex.org/C146357865","wikidata":"https://www.wikidata.org/wiki/Q1123245","display_name":"Stage (stratigraphy)","level":2,"score":0.4832633137702942},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4360736608505249},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.051979243755340576},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/dasc/picom/cbdcom/cy55231.2022.9927875","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasc/picom/cbdcom/cy55231.2022.9927875","pdf_url":null,"source":{"id":"https://openalex.org/S4363605495","display_name":"2022 IEEE Intl Conf on Dependable, Autonomic and Secure Computing, Intl Conf on Pervasive Intelligence and Computing, Intl Conf on Cloud and Big Data Computing, Intl Conf on Cyber Science and Technology Congress (DASC/PiCom/CBDCom/CyberSciTech)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Intl Conf on Dependable, Autonomic and Secure Computing, Intl Conf on Pervasive Intelligence and Computing, Intl Conf on Cloud and Big Data Computing, Intl Conf on Cyber Science and Technology Congress (DASC/PiCom/CBDCom/CyberSciTech)","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.uel.ac.uk:8qx05","is_oa":false,"landing_page_url":"https://doi.org/10.1109/DASC/PiCom/CBDCom/Cy55231.2022.9927875","pdf_url":null,"source":{"id":"https://openalex.org/S4306401301","display_name":"UEL Research Repository (University of East London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I157227730","host_organization_name":"University of East London","host_organization_lineage":["https://openalex.org/I157227730"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"conference-paper"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W46948191","https://openalex.org/W1532958172","https://openalex.org/W2026358225","https://openalex.org/W2041823554","https://openalex.org/W2046056978","https://openalex.org/W2125336414","https://openalex.org/W2125642021","https://openalex.org/W2150769028","https://openalex.org/W2406312423","https://openalex.org/W2407374891","https://openalex.org/W2477779855","https://openalex.org/W2509346200","https://openalex.org/W2515851700","https://openalex.org/W2516631658","https://openalex.org/W2516764878","https://openalex.org/W2601243251","https://openalex.org/W2638067502","https://openalex.org/W2726515241","https://openalex.org/W2746574320","https://openalex.org/W2807305309","https://openalex.org/W2890964092","https://openalex.org/W2917534502","https://openalex.org/W2938358845","https://openalex.org/W2972449503","https://openalex.org/W2972961496","https://openalex.org/W2979593053","https://openalex.org/W3015503328","https://openalex.org/W3020336359","https://openalex.org/W3138445260","https://openalex.org/W3167533889","https://openalex.org/W3178462146","https://openalex.org/W3196595845","https://openalex.org/W3212414183","https://openalex.org/W4226220172","https://openalex.org/W4231743502","https://openalex.org/W6601908271","https://openalex.org/W6713727690","https://openalex.org/W6714259624","https://openalex.org/W6770919351","https://openalex.org/W6786127183","https://openalex.org/W6805819298"],"related_works":["https://openalex.org/W66821593","https://openalex.org/W36105149","https://openalex.org/W2545131480","https://openalex.org/W4401661962","https://openalex.org/W4247736853","https://openalex.org/W1521049138","https://openalex.org/W2144470400","https://openalex.org/W2997340161","https://openalex.org/W2911612049","https://openalex.org/W1964028329"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3],"novel":[4],"Variational":[5],"Bayes":[6],"x-vector":[7,20],"Voice":[8],"Print":[9],"Extraction":[10],"(VBxVPE)":[11],"system,":[12],"capable":[13],"of":[14,51,63,66,69,73,76,81,90,105,108,111,115,118,127],"capturing":[15],"vocal":[16],"variations":[17],"using":[18],"multiple":[19],"representations":[21],"with":[22,83,120],"two-stage":[23],"clustering":[24],"and":[25,32,47,86,93,101,123,130],"outlier":[26],"detection":[27],"for":[28],"robust":[29],"speaker":[30],"recognition":[31],"verification.":[33],"The":[34],"presented":[35],"approach":[36],"demonstrates":[37],"beyond":[38],"the":[39,45,52,55,97,134],"state-of-the-art":[40],"results":[41],"when":[42],"evaluated":[43],"against":[44],"\u2018core-core\u2019":[46,98],"\u2018core-multi\u2019":[48,135],"evaluation":[49,99,136],"conditions":[50],"Speakers":[53],"In":[54],"Wild":[56],"dataset,":[57],"achieving":[58],"an":[59],"Equal":[60,102],"Error":[61,103],"Rate":[62,104],"1.06%,":[64],"Cost":[65,72,107,114],"Detection":[67,74,109,116],"score":[68,75,88,110,117,125],"0.052,":[70],"minimum":[71,113],"0.010,":[77],"Speaker":[78],"Identification":[79],"Accuracy":[80],"95.84%":[82],"Precision,":[84,121],"Recall":[85,122],"F1":[87,124],"values":[89,126],"0.964,":[91],"0.958":[92],"0.961,":[94],"respectively":[95,132],"on":[96,133],"condition":[100],"1.07%,":[106],"0.066,":[112],"0.010":[119],"0.967,":[128],"0.963":[129],"0.965,":[131],"condition.":[137]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2023-01-04T00:00:00"}
