{"id":"https://openalex.org/W2187387698","doi":"https://doi.org/10.21437/odyssey.2014-10","title":"Text-Independent Speaker Verification via State Alignment","display_name":"Text-Independent Speaker Verification via State Alignment","publication_year":2014,"publication_date":"2014-06-16","ids":{"openalex":"https://openalex.org/W2187387698","doi":"https://doi.org/10.21437/odyssey.2014-10","mag":"2187387698"},"language":"en","primary_location":{"id":"doi:10.21437/odyssey.2014-10","is_oa":false,"landing_page_url":"https://doi.org/10.21437/odyssey.2014-10","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2014)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100779405","display_name":"Zhiyi Li","orcid":"https://orcid.org/0000-0001-6407-2554"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhi-Yi Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100692904","display_name":"Wei-Qiang Zhang","orcid":"https://orcid.org/0000-0003-3841-1959"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei-Qiang Zhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100359534","display_name":"Weiwei Liu","orcid":"https://orcid.org/0000-0003-2450-3369"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei-Wei Liu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100571324","display_name":"Yao Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao Tian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100409741","display_name":"Jia Liu","orcid":"https://orcid.org/0000-0003-0383-0934"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia Liu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100779405"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8405,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.82089601,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"68","last_page":"72"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.8449325561523438},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7615180611610413},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7153772115707397},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6608132719993591},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.616170346736908},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.6126534938812256},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5939053297042847},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5861194133758545},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5407469272613525},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5058824419975281},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4232487380504608},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.41721051931381226},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13403400778770447},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1256035566329956}],"concepts":[{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.8449325561523438},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7615180611610413},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7153772115707397},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6608132719993591},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.616170346736908},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.6126534938812256},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5939053297042847},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5861194133758545},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5407469272613525},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5058824419975281},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4232487380504608},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.41721051931381226},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13403400778770447},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1256035566329956},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/odyssey.2014-10","is_oa":false,"landing_page_url":"https://doi.org/10.21437/odyssey.2014-10","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2014)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.6700000166893005,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W48148591","https://openalex.org/W943204654","https://openalex.org/W1571024744","https://openalex.org/W1940231550","https://openalex.org/W2041823554","https://openalex.org/W2079076391","https://openalex.org/W2119468495","https://openalex.org/W2130633305","https://openalex.org/W2143657265","https://openalex.org/W2144760012","https://openalex.org/W2150769028","https://openalex.org/W2153849757","https://openalex.org/W2154278880","https://openalex.org/W2399034162","https://openalex.org/W2408222853"],"related_works":["https://openalex.org/W2529301793","https://openalex.org/W2384121599","https://openalex.org/W2038083449","https://openalex.org/W2180954594","https://openalex.org/W3177678247","https://openalex.org/W1999617572","https://openalex.org/W2052835778","https://openalex.org/W4324119469","https://openalex.org/W2164868312","https://openalex.org/W2160650576"],"abstract_inverted_index":{"To":[0],"model":[1,33],"the":[2,44,65,76,83,106,134,138],"speech":[3,39,85],"utterance":[4,86],"at":[5],"a":[6,12,50,56,101,111],"finer":[7],"granularity,":[8],"this":[9,42],"paper":[10],"presents":[11],"novel":[13],"state-alignment":[14,27],"based":[15,35,119],"supervector":[16,141],"modeling":[17,37,46,142],"method":[18,28,47,113],"for":[19,117],"text-independent":[20,51],"speaker":[21,52],"verification,":[22],"which":[23],"takes":[24],"advantage":[25],"of":[26,78,153],"used":[29],"in":[30,38,92,127],"hidden":[31],"Markov":[32],"(HMM)":[34],"acoustic":[36],"recognition.":[40],"By":[41],"way,":[43],"proposed":[45,116,135],"can":[48],"convert":[49],"verification":[53],"problem":[54],"to":[55,89,99],"state-dependent":[57],"one.":[58],"Firstly,":[59],"phoneme":[60,80],"HMMs":[61],"are":[62],"trained.":[63],"Then":[64],"clustered":[66],"state":[67,93],"Gaussian":[68],"Mixture":[69],"Models":[70],"(GMM)":[71],"is":[72,87,114],"data-driven":[73],"trained":[74],"by":[75,144],"states":[77],"all":[79],"HMMs.":[81],"Next,":[82],"given":[84],"modeled":[88],"sub-GMM":[90],"supervectors":[91],"level":[94],"and":[95,150,155],"be":[96,100],"further":[97],"aligned":[98],"final":[102],"supervector.":[103],"Besides,":[104],"considering":[105],"duration":[107],"differences":[108],"between":[109],"states,":[110],"weighting":[112],"also":[115],"kernel":[118],"support":[120],"vector":[121],"machine":[122],"(SVM)":[123],"classification.":[124],"Experimental":[125],"results":[126],"SRE":[128],"2008":[129],"core-core":[130],"dataset":[131],"show":[132],"that":[133],"methods":[136],"outperform":[137],"traditional":[139],"GMM":[140],"followed":[143],"SVM":[145],"(GSV-SVM),":[146],"yielding":[147],"relative":[148],"8.4%":[149],"5.9%":[151],"improvements":[152],"EER":[154],"minDCF,":[156],"respectively.":[157]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
