{"id":"https://openalex.org/W2036497443","doi":"https://doi.org/10.1109/icassp.2014.6854355","title":"Construction of discriminative Kernels from known and unknown non-targets for PLDA-SVM scoring","display_name":"Construction of discriminative Kernels from known and unknown non-targets for PLDA-SVM scoring","publication_year":2014,"publication_date":"2014-05-01","ids":{"openalex":"https://openalex.org/W2036497443","doi":"https://doi.org/10.1109/icassp.2014.6854355","mag":"2036497443"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2014.6854355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6854355","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035226758","display_name":"Wei Rao","orcid":"https://orcid.org/0000-0002-7237-0874"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Wei Rao","raw_affiliation_strings":["Dept. of Electronic and Information Engineering, Hong Kong Polytechnic University, Hong Kong SAR, China","Dept. of Electron. & Inf. Eng., Hong Kong Polytech. Univ., Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dept. of Electronic and Information Engineering, Hong Kong Polytechnic University, Hong Kong SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Dept. of Electron. & Inf. Eng., Hong Kong Polytech. Univ., Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068768998","display_name":"Man\u2010Wai Mak","orcid":"https://orcid.org/0000-0001-8854-3760"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Man-Wai Mak","raw_affiliation_strings":["Dept. of Electronic and Information Engineering, Hong Kong Polytechnic University, Hong Kong SAR, China","Dept. of Electron. & Inf. Eng., Hong Kong Polytech. Univ., Hong Kong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dept. of Electronic and Information Engineering, Hong Kong Polytechnic University, Hong Kong SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Dept. of Electron. & Inf. Eng., Hong Kong Polytech. Univ., Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6916,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.87556001,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"15","issue":null,"first_page":"4012","last_page":"4016"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.8525561094284058},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.776667594909668},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6945673227310181},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6717932224273682},{"id":"https://openalex.org/keywords/resampling","display_name":"Resampling","score":0.5772247314453125},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.562095046043396},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.5350445508956909},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5132339000701904},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5104783773422241},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5041021108627319},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4872974157333374},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.46527737379074097},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.43127915263175964},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33722037076950073},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1282823085784912},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.08792361617088318}],"concepts":[{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.8525561094284058},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.776667594909668},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6945673227310181},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6717932224273682},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.5772247314453125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.562095046043396},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.5350445508956909},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5132339000701904},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5104783773422241},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5041021108627319},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4872974157333374},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.46527737379074097},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.43127915263175964},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33722037076950073},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1282823085784912},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.08792361617088318}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2014.6854355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6854355","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:ira.lib.polyu.edu.hk:10397/29533","is_oa":false,"landing_page_url":"http://hdl.handle.net/10397/29533","pdf_url":null,"source":{"id":"https://openalex.org/S4306400205","display_name":"PolyU Institutional Research Archive (Hong Kong Polytechnic University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I14243506","host_organization_name":"Hong Kong Polytechnic University","host_organization_lineage":["https://openalex.org/I14243506"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6899999976158142}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1663973292","https://openalex.org/W1916834241","https://openalex.org/W1985043720","https://openalex.org/W1994244061","https://openalex.org/W2002854845","https://openalex.org/W2035732044","https://openalex.org/W2041823554","https://openalex.org/W2050693797","https://openalex.org/W2070752897","https://openalex.org/W2078953162","https://openalex.org/W2088032561","https://openalex.org/W2107638917","https://openalex.org/W2121812409","https://openalex.org/W2121890799","https://openalex.org/W2129066450","https://openalex.org/W2136879537","https://openalex.org/W2139634554","https://openalex.org/W2140389641","https://openalex.org/W2143694533","https://openalex.org/W2144760012","https://openalex.org/W2147147599","https://openalex.org/W2150769028","https://openalex.org/W2156913409","https://openalex.org/W2395747372","https://openalex.org/W2395750323","https://openalex.org/W2397634864","https://openalex.org/W2406312423","https://openalex.org/W2407342067","https://openalex.org/W2595142274","https://openalex.org/W4212863985","https://openalex.org/W6640010188","https://openalex.org/W6712325649","https://openalex.org/W6713727690"],"related_works":["https://openalex.org/W2118039276","https://openalex.org/W2206035908","https://openalex.org/W2162158162","https://openalex.org/W4247736853","https://openalex.org/W1493012537","https://openalex.org/W1999004162","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W4310979479","https://openalex.org/W2696990509"],"abstract_inverted_index":{"Conventional":[0],"PLDA":[1,46],"scoring":[2,35,99,174],"in":[3,33,65,81,132,135,171],"i-vector":[4],"speaker":[5],"verification":[6,83],"involves":[7],"the":[8,28,34,53,73,95,102,112,118,136,149,182,186,193,197,202],"i-vectors":[9,57,159],"of":[10,30,55,75,97,105,157,184,219],"target":[11,60,123],"speakers":[12,32,124,213],"and":[13,108,138,167,188,195],"claimants":[14],"only.":[15],"We":[16],"have":[17,125],"previously":[18],"demonstrated":[19],"that":[20,147,196],"better":[21,173,208],"performance":[22,96],"can":[23,160,200],"be":[24,161],"achieved":[25,42],"by":[26,43,100,163],"incorporating":[27],"information":[29,74],"background":[31],"process":[36],"via":[37],"speaker-dependent":[38,119],"SVMs.":[39,120,175],"This":[40,144],"is":[41,152],"defining":[44],"a":[45,155,216],"score":[47,103],"space":[48],"with":[49,214],"dimension":[50],"equal":[51],"to":[52,71,93,116,206],"number":[54,156,218],"training":[56,192,204],"for":[58,141,191,211],"each":[59,82],"speaker.":[61],"The":[62],"new":[63,91],"protocol":[64,92],"NIST":[66,178],"2012":[67,179],"SRE":[68,180],"permits":[69],"systems":[70],"use":[72],"other":[76],"target-speakers":[77],"(called":[78],"known":[79,107,187],"non-targets)":[80],"trial.":[84],"In":[85],"this":[86,90],"paper,":[87],"we":[88],"exploit":[89],"enhance":[94],"PLDA-SVM":[98],"using":[101],"vectors":[104],"both":[106],"unknown":[109,189],"non-targets":[110,190],"as":[111],"impostor":[113],"class":[114],"data":[115,140],"train":[117],"Because":[121],"some":[122],"one":[126],"enrollment":[127,150,220],"utterance":[128,151,165],"only,":[129],"which":[130],"results":[131],"severe":[133],"imbalance":[134],"speaker-":[137],"impostor-class":[139],"SVM":[142,203],"training.":[143],"paper":[145],"shows":[146],"if":[148],"sufficiently":[153],"long,":[154],"target-speaker":[158],"generated":[162],"an":[164],"partitioning":[166],"resampling":[168,198],"technique,":[169],"resulting":[170],"much":[172],"Results":[176],"on":[177],"demonstrate":[181],"advantages":[183],"pooling":[185],"SVMs":[194],"techniques":[199],"help":[201],"algorithm":[205],"find":[207],"decision":[209],"boundaries":[210],"those":[212],"only":[215],"small":[217],"utterances.":[221]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
