{"id":"https://openalex.org/W2072017324","doi":"https://doi.org/10.1109/icnc.2013.6817977","title":"Duration weighted Gaussian Mixture Model supervector modeling for robust speaker recognition","display_name":"Duration weighted Gaussian Mixture Model supervector modeling for robust speaker recognition","publication_year":2013,"publication_date":"2013-07-01","ids":{"openalex":"https://openalex.org/W2072017324","doi":"https://doi.org/10.1109/icnc.2013.6817977","mag":"2072017324"},"language":"en","primary_location":{"id":"doi:10.1109/icnc.2013.6817977","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icnc.2013.6817977","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 Ninth International Conference on Natural Computation (ICNC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029218568","display_name":"Zhe Ji","orcid":"https://orcid.org/0000-0002-1809-8099"},"institutions":[{"id":"https://openalex.org/I4210087772","display_name":"National Computer Network Emergency Response Technical Team/Coordination Center of Chinar","ror":"https://ror.org/00247dh76","country_code":"CN","type":"nonprofit","lineage":["https://openalex.org/I4210087772"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhe Ji","raw_affiliation_strings":["Telecom Network Security Division, Technical Team Coordination Center of China (CNCERT/CC), Beijing, China","Telecom Network Security Division, National Computer network Emergency Response, technical Team Coordination Center of China (CNCERT/CC), Beijing, 100029, China"],"affiliations":[{"raw_affiliation_string":"Telecom Network Security Division, Technical Team Coordination Center of China (CNCERT/CC), Beijing, China","institution_ids":["https://openalex.org/I4210087772"]},{"raw_affiliation_string":"Telecom Network Security Division, National Computer network Emergency Response, technical Team Coordination Center of China (CNCERT/CC), Beijing, 100029, China","institution_ids":["https://openalex.org/I4210087772"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102005045","display_name":"Wei Hou","orcid":"https://orcid.org/0000-0002-1961-2184"},"institutions":[{"id":"https://openalex.org/I4210087772","display_name":"National Computer Network Emergency Response Technical Team/Coordination Center of Chinar","ror":"https://ror.org/00247dh76","country_code":"CN","type":"nonprofit","lineage":["https://openalex.org/I4210087772"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Hou","raw_affiliation_strings":["Telecom Network Security Division, Technical Team Coordination Center of China (CNCERT/CC), Beijing, China","Telecom Network Security Division, National Computer network Emergency Response, technical Team Coordination Center of China (CNCERT/CC), Beijing, 100029, China"],"affiliations":[{"raw_affiliation_string":"Telecom Network Security Division, Technical Team Coordination Center of China (CNCERT/CC), Beijing, China","institution_ids":["https://openalex.org/I4210087772"]},{"raw_affiliation_string":"Telecom Network Security Division, National Computer network Emergency Response, technical Team Coordination Center of China (CNCERT/CC), Beijing, 100029, China","institution_ids":["https://openalex.org/I4210087772"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101882003","display_name":"Xin Jin","orcid":"https://orcid.org/0000-0001-7888-6954"},"institutions":[{"id":"https://openalex.org/I4210087772","display_name":"National Computer Network Emergency Response Technical Team/Coordination Center of Chinar","ror":"https://ror.org/00247dh76","country_code":"CN","type":"nonprofit","lineage":["https://openalex.org/I4210087772"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Jin","raw_affiliation_strings":["Telecom Network Security Division, Technical Team Coordination Center of China (CNCERT/CC), Beijing, China","Telecom Network Security Division, National Computer network Emergency Response, technical Team Coordination Center of China (CNCERT/CC), Beijing, 100029, China"],"affiliations":[{"raw_affiliation_string":"Telecom Network Security Division, Technical Team Coordination Center of China (CNCERT/CC), Beijing, China","institution_ids":["https://openalex.org/I4210087772"]},{"raw_affiliation_string":"Telecom Network Security Division, National Computer network Emergency Response, technical Team Coordination Center of China (CNCERT/CC), Beijing, 100029, China","institution_ids":["https://openalex.org/I4210087772"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100779410","display_name":"Zhiyi Li","orcid":"https://orcid.org/0009-0000-6883-6101"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhi-Yi Li","raw_affiliation_strings":["Department of Electronic Engineering, Tsinghua University, Beijing, China","Department of Electronic Engineering, Tsinghua University,#N#Beijing  100084, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Department of Electronic Engineering, Tsinghua University,#N#Beijing  100084, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5029218568"],"corresponding_institution_ids":["https://openalex.org/I4210087772"],"apc_list":null,"apc_paid":null,"fwci":0.9618,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.82337926,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"10","issue":null,"first_page":"238","last_page":"241"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.7407223582267761},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.6751788258552551},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.662703275680542},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6589565277099609},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.5761563777923584},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.5734318494796753},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5057206153869629},{"id":"https://openalex.org/keywords/kullback\u2013leibler-divergence","display_name":"Kullback\u2013Leibler divergence","score":0.5048869252204895},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.49775341153144836},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4695141017436981},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4539492130279541},{"id":"https://openalex.org/keywords/duration","display_name":"Duration (music)","score":0.4430353343486786},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4069749712944031}],"concepts":[{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.7407223582267761},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.6751788258552551},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.662703275680542},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6589565277099609},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.5761563777923584},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.5734318494796753},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5057206153869629},{"id":"https://openalex.org/C171752962","wikidata":"https://www.wikidata.org/wiki/Q255166","display_name":"Kullback\u2013Leibler divergence","level":2,"score":0.5048869252204895},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.49775341153144836},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4695141017436981},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4539492130279541},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.4430353343486786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4069749712944031},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icnc.2013.6817977","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icnc.2013.6817977","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 Ninth International Conference on Natural Computation (ICNC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W63837534","https://openalex.org/W1571024744","https://openalex.org/W2041823554","https://openalex.org/W2144760012","https://openalex.org/W2154278880","https://openalex.org/W2183001115","https://openalex.org/W2397634864","https://openalex.org/W2403776763","https://openalex.org/W4239510810"],"related_works":["https://openalex.org/W1197719229","https://openalex.org/W2381158726","https://openalex.org/W1992796048","https://openalex.org/W2129090883","https://openalex.org/W2131049662","https://openalex.org/W1516392727","https://openalex.org/W2379906719","https://openalex.org/W2412815366","https://openalex.org/W2181956362","https://openalex.org/W2136153680"],"abstract_inverted_index":{"To":[0],"make":[1],"the":[2,31,36,65,121,125],"supervector":[3,23,62,75,128],"modeling":[4,24,129],"of":[5,39,82,91,108,136],"speech":[6,40,83],"utterance":[7,41],"more":[8],"effective":[9],"and":[10,58,100,110,133,141],"accurate,":[11],"this":[12,33,86],"paper":[13,87],"proposes":[14],"a":[15,45,72,89],"new":[16],"duration":[17,73,80],"weighted":[18],"Gaussian":[19],"Mixture":[20],"Model":[21,50],"(GMM)":[22],"method":[25,34,90,123],"for":[26,78],"robust":[27],"speaker":[28],"recognition.":[29],"At":[30],"beginning,":[32],"adapts":[35],"acoustic":[37],"features":[38],"to":[42,93],"GMM":[43,61,127],"from":[44],"common":[46],"basic":[47],"Universal":[48],"Background":[49],"(UBM)":[51],"with":[52,130],"Maximum":[53],"A":[54],"Posterior":[55],"(MAP)":[56],"criterion":[57],"then":[59],"models":[60],"by":[63],"bounding":[64],"Kullback-Leibler":[66],"(KL)":[67],"divergence":[68],"measure.":[69],"In":[70],"addition,":[71],"weight":[74],"is":[76],"modeled":[77],"using":[79],"information":[81],"utterances.":[84],"Furthermore,":[85],"presents":[88],"how":[92],"effectively":[94],"apply":[95],"them":[96],"together":[97],"during":[98],"training":[99],"classification.":[101],"Experimental":[102],"results":[103],"on":[104],"American":[105],"National":[106],"Institute":[107],"Standards":[109],"Technology":[111],"Speaker":[112],"Recognition":[113],"Evaluation":[114],"(NIST":[115],"SRE)":[116],"2008":[117],"dataset":[118],"demonstrate":[119],"that":[120],"proposed":[122],"outperforms":[124],"traditional":[126],"relative":[131],"16%":[132],"10%":[134],"improvements":[135],"Equal":[137],"Error":[138],"Rate":[139],"(EER)":[140],"Minimum":[142],"Detection":[143],"Cost":[144],"Function":[145],"(MinDCF),":[146],"respectively.":[147]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
