{"id":"https://openalex.org/W2068865112","doi":"https://doi.org/10.1109/apsipa.2014.7041692","title":"Intrinsic variation robust speaker verification based on sparse representation","display_name":"Intrinsic variation robust speaker verification based on sparse representation","publication_year":2014,"publication_date":"2014-12-01","ids":{"openalex":"https://openalex.org/W2068865112","doi":"https://doi.org/10.1109/apsipa.2014.7041692","mag":"2068865112"},"language":"en","primary_location":{"id":"doi:10.1109/apsipa.2014.7041692","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2014.7041692","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Signal and Information Processing Association Annual Summit and Conference (APSIPA), 2014 Asia-Pacific","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090138515","display_name":"Yi Han Nie","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yi Nie","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China","Key Laboratory of Pervasive Computing, Ministry of Education, Tsinghua National Laboratory for Information Science and Technology (TNList), Department of Computer Science and Technology, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Key Laboratory of Pervasive Computing, Ministry of Education, Tsinghua National Laboratory for Information Science and Technology (TNList), Department of Computer Science and Technology, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083894790","display_name":"Mingxing Xu","orcid":"https://orcid.org/0000-0002-3215-3496"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingxing Xu","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China","Key Laboratory of Pervasive Computing, Ministry of Education, Tsinghua National Laboratory for Information Science and Technology (TNList), Department of Computer Science and Technology, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Key Laboratory of Pervasive Computing, Ministry of Education, Tsinghua National Laboratory for Information Science and Technology (TNList), Department of Computer Science and Technology, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060610398","display_name":"Haishu Xianyu","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haishu Xianyu","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China","Key Laboratory of Pervasive Computing, Ministry of Education, Tsinghua National Laboratory for Information Science and Technology (TNList), Department of Computer Science and Technology, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Key Laboratory of Pervasive Computing, Ministry of Education, Tsinghua National Laboratory for Information Science and Technology (TNList), Department of Computer Science and Technology, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5090138515"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.227,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.84807561,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"5","issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9758999943733215,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.7808394432067871},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6984947323799133},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.6484704613685608},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4938820004463196},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4449813961982727},{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.43213897943496704},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.423700213432312},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41472938656806946},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4056841731071472}],"concepts":[{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.7808394432067871},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6984947323799133},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.6484704613685608},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4938820004463196},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4449813961982727},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.43213897943496704},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.423700213432312},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41472938656806946},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4056841731071472},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipa.2014.7041692","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2014.7041692","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Signal and Information Processing Association Annual Summit and Conference (APSIPA), 2014 Asia-Pacific","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7400000095367432,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W152668300","https://openalex.org/W189651667","https://openalex.org/W1625928172","https://openalex.org/W1916834241","https://openalex.org/W2098742827","https://openalex.org/W2107638917","https://openalex.org/W2129812935","https://openalex.org/W2150769028","https://openalex.org/W2161428459","https://openalex.org/W2245139446","https://openalex.org/W2396843110","https://openalex.org/W3022380717","https://openalex.org/W6606286508","https://openalex.org/W6640010188","https://openalex.org/W6690606286"],"related_works":["https://openalex.org/W66821593","https://openalex.org/W4297807400","https://openalex.org/W1491159402","https://openalex.org/W4313854686","https://openalex.org/W321304764","https://openalex.org/W2249138175","https://openalex.org/W1521299571","https://openalex.org/W3162054169","https://openalex.org/W1516392727","https://openalex.org/W2140022733"],"abstract_inverted_index":{"Intrinsic":[0],"variation":[1,27,63,78],"is":[2],"one":[3],"of":[4,11,52,61,100,162],"the":[5,32,36,39,53,58,96,116,143,151],"major":[6],"factors":[7],"that":[8,115,142],"aggravate":[9],"performance":[10],"speaker":[12],"verification":[13],"system":[14,148],"dramatically.":[15],"In":[16,91],"this":[17],"paper,":[18],"we":[19,49,94],"focus":[20],"on":[21,75],"alleviating":[22],"influence":[23],"caused":[24],"by":[25,135],"intrinsic":[26,62,77],"using":[28],"sparse":[29,118,146],"representation.":[30],"Because":[31],"over-complete":[33],"dictionary":[34,54,69,72,105],"increases":[35],"flexibility":[37],"and":[38,70,80,88,127,137],"ability":[40],"to":[41,43,103],"adapt":[42],"variable":[44],"data":[45],"in":[46],"signal":[47],"representation,":[48],"expect":[50],"redundancy":[51],"could":[55],"benefit":[56],"addressing":[57],"implicit":[59],"properties":[60],"within":[64],"each":[65],"speaker.":[66],"Both":[67],"exemplar":[68],"learned":[71],"are":[73],"evaluated":[74],"an":[76,156],"corpus":[79],"compared":[81],"with":[82,106],"GMM-UBM,":[83,125],"Joint":[84],"Factor":[85],"Analysis":[86],"(JFA)":[87],"i-vector":[89,128],"systems.":[90],"our":[92],"system,":[93],"choose":[95],"K-SVD":[97,144],"algorithm,":[98],"generalization":[99],"K-means":[101],"algorithm":[102],"learn":[104],"Singular":[107],"Value":[108],"Decomposition":[109],"(SVD).":[110],"The":[111],"experiment":[112],"results":[113],"show":[114],"two":[117],"representation":[119,147],"systems":[120,129],"achieve":[121,155],"higher":[122],"accuracy":[123],"than":[124],"JFA":[126],"consistently,":[130],"especially":[131],"outperform":[132],"GMM-UBM":[133],"respectively":[134],"37.17%":[136],"41.55%.":[138],"We":[139],"also":[140],"find":[141],"based":[145],"has":[149],"almost":[150],"best":[152],"performance,":[153],"which":[154],"average":[157],"Error":[158],"Equal":[159],"Rate":[160],"(EER)":[161],"14.23%.":[163]},"counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
