{"id":"https://openalex.org/W2068004116","doi":"https://doi.org/10.1109/icassp.2013.6639168","title":"Compensation for inter-frame correlations in speaker diarization and recognition","display_name":"Compensation for inter-frame correlations in speaker diarization and recognition","publication_year":2013,"publication_date":"2013-05-01","ids":{"openalex":"https://openalex.org/W2068004116","doi":"https://doi.org/10.1109/icassp.2013.6639168","mag":"2068004116"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2013.6639168","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639168","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061939508","display_name":"Themos Stafylakis","orcid":"https://orcid.org/0000-0002-9227-3588"},"institutions":[{"id":"https://openalex.org/I4210111842","display_name":"Computer Research Institute of Montr\u00e9al","ror":"https://ror.org/0279d5115","country_code":"CA","type":"nonprofit","lineage":["https://openalex.org/I4210111842"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Themos Stafylakis","raw_affiliation_strings":["Centre de recherche informatique de Montreal, Montreal, QC, CA","Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre de recherche informatique de Montreal, Montreal, QC, CA","institution_ids":["https://openalex.org/I4210111842"]},{"raw_affiliation_string":"Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada","institution_ids":["https://openalex.org/I4210111842"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036466893","display_name":"Patrick Kenny","orcid":null},"institutions":[{"id":"https://openalex.org/I4210111842","display_name":"Computer Research Institute of Montr\u00e9al","ror":"https://ror.org/0279d5115","country_code":"CA","type":"nonprofit","lineage":["https://openalex.org/I4210111842"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Patrick Kenny","raw_affiliation_strings":["Centre de Recherche Informatique de Montreal, Canada","Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre de Recherche Informatique de Montreal, Canada","institution_ids":["https://openalex.org/I4210111842"]},{"raw_affiliation_string":"Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada","institution_ids":["https://openalex.org/I4210111842"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114009216","display_name":"Vishwa Gupta","orcid":null},"institutions":[{"id":"https://openalex.org/I4210111842","display_name":"Computer Research Institute of Montr\u00e9al","ror":"https://ror.org/0279d5115","country_code":"CA","type":"nonprofit","lineage":["https://openalex.org/I4210111842"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Vishwa Gupta","raw_affiliation_strings":["Centre de Recherche Informatique de Montreal, Canada","Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre de Recherche Informatique de Montreal, Canada","institution_ids":["https://openalex.org/I4210111842"]},{"raw_affiliation_string":"Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada","institution_ids":["https://openalex.org/I4210111842"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034083532","display_name":"Pierre Dumouchel","orcid":"https://orcid.org/0000-0001-5584-4428"},"institutions":[{"id":"https://openalex.org/I4210111842","display_name":"Computer Research Institute of Montr\u00e9al","ror":"https://ror.org/0279d5115","country_code":"CA","type":"nonprofit","lineage":["https://openalex.org/I4210111842"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Pierre Dumouchel","raw_affiliation_strings":["Centre de recherche informatique de Montreal, Montreal, QC, CA","Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre de recherche informatique de Montreal, Montreal, QC, CA","institution_ids":["https://openalex.org/I4210111842"]},{"raw_affiliation_string":"Centre de Rech. Inf. de Montreal (CRIM), Montreal, QC, Canada","institution_ids":["https://openalex.org/I4210111842"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210111842"],"apc_list":null,"apc_paid":null,"fwci":1.9774,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.886796,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"7731","last_page":"7735"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.7899186611175537},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.7868616580963135},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6843020915985107},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6327489614486694},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.6229999661445618},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.577529788017273},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.49443650245666504},{"id":"https://openalex.org/keywords/sample-size-determination","display_name":"Sample size determination","score":0.4887516498565674},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48433196544647217},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4768979549407959},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.45745837688446045},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.4437435567378998},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.43907594680786133},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.43716636300086975},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42334532737731934},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.21337378025054932},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1749494969844818}],"concepts":[{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.7899186611175537},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.7868616580963135},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6843020915985107},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6327489614486694},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.6229999661445618},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.577529788017273},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.49443650245666504},{"id":"https://openalex.org/C129848803","wikidata":"https://www.wikidata.org/wiki/Q2564360","display_name":"Sample size determination","level":2,"score":0.4887516498565674},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48433196544647217},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4768979549407959},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45745837688446045},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.4437435567378998},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.43907594680786133},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.43716636300086975},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42334532737731934},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.21337378025054932},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1749494969844818},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2013.6639168","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639168","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:espace2.etsmtl.ca:6017","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306402392","display_name":"Espace \u00c9TS (ETS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1341030882","host_organization_name":"Educational Testing Service","host_organization_lineage":["https://openalex.org/I1341030882"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"Compte rendu de conf\u00e9rence"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.44999998807907104,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W72302491","https://openalex.org/W106647055","https://openalex.org/W1482605500","https://openalex.org/W2064364374","https://openalex.org/W2090968725","https://openalex.org/W2096849680","https://openalex.org/W2129161539","https://openalex.org/W2140046090","https://openalex.org/W2150769028","https://openalex.org/W2157299333","https://openalex.org/W2168175751","https://openalex.org/W2395750323","https://openalex.org/W2397474108","https://openalex.org/W2400584454","https://openalex.org/W2401594978","https://openalex.org/W2972891548","https://openalex.org/W6628911050","https://openalex.org/W6674608193"],"related_works":["https://openalex.org/W2118039276","https://openalex.org/W2206035908","https://openalex.org/W2162158162","https://openalex.org/W4247736853","https://openalex.org/W1493012537","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W4310979479","https://openalex.org/W2696990509","https://openalex.org/W1999004162"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"introduce":[4],"the":[5,8,20,23,45,51,62,69,74,88,109],"concept":[6],"of":[7,22,54,57,65],"effective":[9,46,89],"sample":[10,25,47,52,90],"size":[11,26,53,91],"to":[12,29,114],"speaker":[13,83,121],"diarization":[14,84],"and":[15,36,72,103,106,131],"recognition.":[16],"We":[17,42],"show":[18,85],"why":[19],"use":[21],"nominal":[24],"is":[27,50,92,112],"inadequate":[28],"feature":[30],"streams":[31],"that":[32,49,60,86],"exhibit":[33],"inter-frame":[34],"correlations":[35],"how":[37,73],"it":[38],"adversely":[39],"affects":[40],"inference.":[41],"then":[43],"discuss":[44],"size,":[48],"a":[55],"set":[56,113],"independent":[58],"observations":[59],"carry":[61],"equivalent":[63],"amount":[64],"statistical":[66],"information":[67],"about":[68],"model":[70],"parameters":[71],"scaling":[75,110],"factor":[76,111],"can":[77,96],"be":[78,97,115],"estimated.":[79],"Our":[80],"experiments":[81],"on":[82,127],"once":[87],"adopted,":[93],"state-of-the-art":[94],"results":[95,124],"attained":[98],"even":[99,107],"with":[100],"single":[101],"Gaussians":[102],"Hierarchical":[104],"Clustering,":[105],"when":[108],"common":[116],"for":[117],"all":[118],"utterances.":[119],"On":[120],"recognition,":[122],"encouraging":[123],"are":[125],"reported":[126],"NIST-2010":[128],"using":[129],"iVectors":[130],"PLDA.":[132]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":3}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
