{"id":"https://openalex.org/W4390187207","doi":"https://doi.org/10.1109/taslp.2023.3346293","title":"Review of Methods for Automatic Speaker Verification","display_name":"Review of Methods for Automatic Speaker Verification","publication_year":2023,"publication_date":"2023-12-25","ids":{"openalex":"https://openalex.org/W4390187207","doi":"https://doi.org/10.1109/taslp.2023.3346293"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2023.3346293","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3346293","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011489869","display_name":"Douglas O\u2019Shaughnessy","orcid":"https://orcid.org/0000-0002-0110-2346"},"institutions":[{"id":"https://openalex.org/I39481719","display_name":"Institut National de la Recherche Scientifique","ror":"https://ror.org/04td37d32","country_code":"CA","type":"education","lineage":["https://openalex.org/I39481719","https://openalex.org/I49663120"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Douglas O'Shaughnessy","raw_affiliation_strings":["Institut national de la recherche scientifique Centre energie Materiaux Telecommunications, Montreal, Quebec, Canada"],"affiliations":[{"raw_affiliation_string":"Institut national de la recherche scientifique Centre energie Materiaux Telecommunications, Montreal, Quebec, Canada","institution_ids":["https://openalex.org/I39481719"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5011489869"],"corresponding_institution_ids":["https://openalex.org/I39481719"],"apc_list":null,"apc_paid":null,"fwci":0.3491,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67563641,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"32","issue":null,"first_page":"1776","last_page":"1789"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7837522029876709},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7823229432106018},{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.6320502161979675},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.6045776605606079},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.6007809042930603},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.6004716157913208},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5306687951087952},{"id":"https://openalex.org/keywords/linear-prediction","display_name":"Linear prediction","score":0.4669032692909241},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.46626123785972595},{"id":"https://openalex.org/keywords/spectral-envelope","display_name":"Spectral envelope","score":0.4435039162635803},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4155268669128418},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32303881645202637},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.24759796261787415}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7837522029876709},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7823229432106018},{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.6320502161979675},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.6045776605606079},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.6007809042930603},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.6004716157913208},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5306687951087952},{"id":"https://openalex.org/C131109320","wikidata":"https://www.wikidata.org/wiki/Q581012","display_name":"Linear prediction","level":2,"score":0.4669032692909241},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.46626123785972595},{"id":"https://openalex.org/C54926389","wikidata":"https://www.wikidata.org/wiki/Q7575188","display_name":"Spectral envelope","level":2,"score":0.4435039162635803},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4155268669128418},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32303881645202637},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.24759796261787415},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2023.3346293","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3346293","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2516803194","display_name":null,"funder_award_id":"142610","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":109,"referenced_works":["https://openalex.org/W114428419","https://openalex.org/W1523682477","https://openalex.org/W1533303231","https://openalex.org/W1563235770","https://openalex.org/W1916834241","https://openalex.org/W1936725236","https://openalex.org/W1964357740","https://openalex.org/W1966264494","https://openalex.org/W1970352604","https://openalex.org/W1985690171","https://openalex.org/W1989702938","https://openalex.org/W1996171898","https://openalex.org/W1999405202","https://openalex.org/W2025164940","https://openalex.org/W2026554312","https://openalex.org/W2040266692","https://openalex.org/W2041823554","https://openalex.org/W2045956438","https://openalex.org/W2046056978","https://openalex.org/W2050693797","https://openalex.org/W2057038408","https://openalex.org/W2059529407","https://openalex.org/W2064675550","https://openalex.org/W2078169166","https://openalex.org/W2078455576","https://openalex.org/W2078953162","https://openalex.org/W2080794664","https://openalex.org/W2091425152","https://openalex.org/W2101556109","https://openalex.org/W2101927907","https://openalex.org/W2114925438","https://openalex.org/W2121415728","https://openalex.org/W2121551440","https://openalex.org/W2121750345","https://openalex.org/W2123768812","https://openalex.org/W2123867168","https://openalex.org/W2125838338","https://openalex.org/W2128391065","https://openalex.org/W2130806807","https://openalex.org/W2132549764","https://openalex.org/W2135034868","https://openalex.org/W2136879537","https://openalex.org/W2137075158","https://openalex.org/W2141278204","https://openalex.org/W2144760012","https://openalex.org/W2146173625","https://openalex.org/W2148154194","https://openalex.org/W2150769028","https://openalex.org/W2154278880","https://openalex.org/W2155798363","https://openalex.org/W2156909104","https://openalex.org/W2163065939","https://openalex.org/W2163181067","https://openalex.org/W2167191127","https://openalex.org/W2170065313","https://openalex.org/W2180748755","https://openalex.org/W2187089797","https://openalex.org/W2395750323","https://openalex.org/W2516631658","https://openalex.org/W2592168896","https://openalex.org/W2747165665","https://openalex.org/W2752782242","https://openalex.org/W2770454110","https://openalex.org/W2784163702","https://openalex.org/W2801581493","https://openalex.org/W2888728157","https://openalex.org/W2888968865","https://openalex.org/W2916104401","https://openalex.org/W2963127163","https://openalex.org/W2964052309","https://openalex.org/W2969656782","https://openalex.org/W2969985801","https://openalex.org/W2972668418","https://openalex.org/W2972992051","https://openalex.org/W2981022124","https://openalex.org/W2981087920","https://openalex.org/W2982474723","https://openalex.org/W3008712156","https://openalex.org/W3015791598","https://openalex.org/W3022104823","https://openalex.org/W3023104975","https://openalex.org/W3024388846","https://openalex.org/W3024869864","https://openalex.org/W3026777299","https://openalex.org/W3035725276","https://openalex.org/W3096029132","https://openalex.org/W3098926221","https://openalex.org/W3103152812","https://openalex.org/W3105202226","https://openalex.org/W3137249133","https://openalex.org/W3141035251","https://openalex.org/W3142516134","https://openalex.org/W3171302872","https://openalex.org/W3201773091","https://openalex.org/W3209059054","https://openalex.org/W3212886388","https://openalex.org/W4206319965","https://openalex.org/W4214568179","https://openalex.org/W4288091954","https://openalex.org/W4289752563","https://openalex.org/W4297841461","https://openalex.org/W4297841768","https://openalex.org/W4300985418","https://openalex.org/W6713727690","https://openalex.org/W6743520202","https://openalex.org/W6747381837","https://openalex.org/W6751420435","https://openalex.org/W6769178842","https://openalex.org/W6780218876"],"related_works":["https://openalex.org/W2100012411","https://openalex.org/W1482212662","https://openalex.org/W3162157266","https://openalex.org/W2162084437","https://openalex.org/W1997579527","https://openalex.org/W2102353451","https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W2394579548"],"abstract_inverted_index":{"A":[0],"review":[1],"of":[2,16,52,62,66,78,80,91,134],"techniques":[3],"to":[4,82,121,143],"identify":[5],"speakers":[6],"from":[7,41,59,75],"their":[8,84],"voices":[9],"is":[10,43,129],"presented,":[11],"noting":[12],"strengths":[13],"and":[14,29,47,103,115],"weaknesses":[15],"various":[17,132],"methods.":[18],"Similar":[19],"acoustic":[20],"analysis":[21,95],"has":[22],"been":[23],"often":[24],"used":[25],"for":[26,55,124],"both":[27],"speech":[28,57,94,126],"speaker":[30,139],"recognition,":[31],"despite":[32],"the":[33,50,63,67,76],"two":[34],"tasks":[35],"being":[36],"quite":[37],"different.":[38],"Speaker":[39],"biometrics":[40],"voice":[42],"far":[44],"more":[45],"indirect":[46],"subtle":[48],"than":[49],"estimation":[51],"phoneme":[53],"sequences":[54],"automatic":[56,138],"recognition":[58],"periodic":[60],"evaluations":[61],"spectral":[64],"envelope":[65],"vocal":[68],"tract":[69],"output.":[70],"Speech":[71],"signals":[72],"are":[73,106,119,147],"discussed":[74],"point":[77],"view":[79],"how":[81,131],"recognize":[83],"textual":[85],"content":[86],"versus":[87],"estimating":[88],"other":[89],"aspects":[90],"speakers.":[92],"Common":[93],"methods":[96,146],"such":[97,109],"as":[98,110],"filter":[99],"banks,":[100],"linear":[101],"prediction,":[102],"mel-frequency":[104],"cepstrum":[105],"examined.":[107],"Approaches":[108],"hidden":[111],"Markov":[112],"models,":[113],"i-vectors,":[114],"artificial":[116],"neural":[117],"networks":[118,135],"shown":[120],"be":[122],"useful":[123],"multiple":[125],"applications.":[127],"Focus":[128],"on":[130],"types":[133],"can":[136],"accomplish":[137],"verification":[140],"(ASV).":[141],"Suggestions":[142],"improve":[144],"these":[145],"made.":[148]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
