{"id":"https://openalex.org/W2145846419","doi":"https://doi.org/10.1109/taslp.2015.2442757","title":"SNR-Invariant PLDA Modeling in Nonparametric Subspace for Robust Speaker Verification","display_name":"SNR-Invariant PLDA Modeling in Nonparametric Subspace for Robust Speaker Verification","publication_year":2015,"publication_date":"2015-06-09","ids":{"openalex":"https://openalex.org/W2145846419","doi":"https://doi.org/10.1109/taslp.2015.2442757","mag":"2145846419"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2015.2442757","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2015.2442757","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://ira.lib.polyu.edu.hk/bitstream/10397/16012/1/SNR-invariant_PLDmodeling_Nonparametric.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100368199","display_name":"Na Li","orcid":"https://orcid.org/0000-0003-2669-0233"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Na Li","raw_affiliation_strings":["The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong SAR, China","The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, China"],"affiliations":[{"raw_affiliation_string":"The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068768998","display_name":"Man\u2010Wai Mak","orcid":"https://orcid.org/0000-0001-8854-3760"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Man-Wai Mak","raw_affiliation_strings":["The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong SAR, China","The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, China"],"affiliations":[{"raw_affiliation_string":"The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, Hong Kong SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"The Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Hung Hom, China","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100368199"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":9.4918,"has_fulltext":true,"cited_by_count":41,"citation_normalized_percentile":{"value":0.97943157,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"23","issue":"10","first_page":"1648","last_page":"1659"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9847999811172485,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7570482492446899},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.727103590965271},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6724703311920166},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.6179168820381165},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5637056231498718},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.5550106167793274},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5479791164398193},{"id":"https://openalex.org/keywords/invariant","display_name":"Invariant (physics)","score":0.5394706130027771},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4459823966026306},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.43179967999458313},{"id":"https://openalex.org/keywords/nonparametric-statistics","display_name":"Nonparametric statistics","score":0.41748344898223877},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.41475600004196167},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4008103013038635},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.27017587423324585},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.11436104774475098}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7570482492446899},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.727103590965271},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6724703311920166},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.6179168820381165},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5637056231498718},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.5550106167793274},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5479791164398193},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.5394706130027771},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4459823966026306},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.43179967999458313},{"id":"https://openalex.org/C102366305","wikidata":"https://www.wikidata.org/wiki/Q1097688","display_name":"Nonparametric statistics","level":2,"score":0.41748344898223877},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.41475600004196167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4008103013038635},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27017587423324585},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11436104774475098},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2015.2442757","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2015.2442757","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:ira.lib.polyu.edu.hk:10397/16012","is_oa":true,"landing_page_url":"http://hdl.handle.net/10397/16012","pdf_url":"http://ira.lib.polyu.edu.hk/bitstream/10397/16012/1/SNR-invariant_PLDmodeling_Nonparametric.pdf","source":{"id":"https://openalex.org/S4306400205","display_name":"PolyU Institutional Research Archive (Hong Kong Polytechnic University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I14243506","host_organization_name":"Hong Kong Polytechnic University","host_organization_lineage":["https://openalex.org/I14243506"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal/Magazine Article"}],"best_oa_location":{"id":"pmh:oai:ira.lib.polyu.edu.hk:10397/16012","is_oa":true,"landing_page_url":"http://hdl.handle.net/10397/16012","pdf_url":"http://ira.lib.polyu.edu.hk/bitstream/10397/16012/1/SNR-invariant_PLDmodeling_Nonparametric.pdf","source":{"id":"https://openalex.org/S4306400205","display_name":"PolyU Institutional Research Archive (Hong Kong Polytechnic University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I14243506","host_organization_name":"Hong Kong Polytechnic University","host_organization_lineage":["https://openalex.org/I14243506"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal/Magazine Article"},"sustainable_development_goals":[{"score":0.7200000286102295,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G4271622844","display_name":null,"funder_award_id":"G-YN18","funder_id":"https://openalex.org/F4320322598","funder_display_name":"Hong Kong Polytechnic University"}],"funders":[{"id":"https://openalex.org/F4320322598","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2145846419.pdf","grobid_xml":"https://content.openalex.org/works/W2145846419.grobid-xml"},"referenced_works_count":62,"referenced_works":["https://openalex.org/W111477576","https://openalex.org/W204053250","https://openalex.org/W775331923","https://openalex.org/W1501458753","https://openalex.org/W1506806321","https://openalex.org/W1512532673","https://openalex.org/W1540327379","https://openalex.org/W1586405805","https://openalex.org/W1663973292","https://openalex.org/W1770825568","https://openalex.org/W1916834241","https://openalex.org/W1964422643","https://openalex.org/W1970748944","https://openalex.org/W1970872899","https://openalex.org/W1992975485","https://openalex.org/W1994244061","https://openalex.org/W2002854845","https://openalex.org/W2034626437","https://openalex.org/W2041823554","https://openalex.org/W2050693797","https://openalex.org/W2055611715","https://openalex.org/W2080794664","https://openalex.org/W2090716422","https://openalex.org/W2105393821","https://openalex.org/W2121061347","https://openalex.org/W2121750345","https://openalex.org/W2121812409","https://openalex.org/W2129066450","https://openalex.org/W2129379984","https://openalex.org/W2135346934","https://openalex.org/W2136879537","https://openalex.org/W2142799607","https://openalex.org/W2143054781","https://openalex.org/W2144760012","https://openalex.org/W2150769028","https://openalex.org/W2154278880","https://openalex.org/W2159736522","https://openalex.org/W2168056867","https://openalex.org/W2168959749","https://openalex.org/W2295897503","https://openalex.org/W2395069802","https://openalex.org/W2395750323","https://openalex.org/W2396361679","https://openalex.org/W2397634864","https://openalex.org/W2400341349","https://openalex.org/W2401027203","https://openalex.org/W2406312423","https://openalex.org/W2406521968","https://openalex.org/W2407231000","https://openalex.org/W2407342067","https://openalex.org/W3145164839","https://openalex.org/W4212863985","https://openalex.org/W4246070010","https://openalex.org/W4298164478","https://openalex.org/W6622345507","https://openalex.org/W6632370842","https://openalex.org/W6635268374","https://openalex.org/W6712094196","https://openalex.org/W6712325649","https://openalex.org/W6712861115","https://openalex.org/W6713727690","https://openalex.org/W6714201320"],"related_works":["https://openalex.org/W66821593","https://openalex.org/W2053159670","https://openalex.org/W2051274299","https://openalex.org/W3148366653","https://openalex.org/W1521299571","https://openalex.org/W468945283","https://openalex.org/W3141593045","https://openalex.org/W204267554","https://openalex.org/W2134501921","https://openalex.org/W4252590334"],"abstract_inverted_index":{"While":[0],"i-vector/PLDA":[1],"framework":[2,35,141],"has":[3],"achieved":[4],"great":[5],"success,":[6],"its":[7],"performance":[8,144],"still":[9],"degrades":[10],"dramatically":[11],"under":[12],"noisy":[13],"conditions.":[14],"To":[15],"compensate":[16],"for":[17,36],"the":[18,53,58,63,68,77,96,115,127,139,148],"variability":[19,116],"of":[20,26,106,154],"i-vectors":[21],"caused":[22],"by":[23],"different":[24],"levels":[25],"background":[27],"noise,":[28],"this":[29],"paper":[30],"proposes":[31],"an":[32,84,88],"SNR-invariant":[33,71],"PLDA":[34,72,150],"robust":[37],"speaker":[38],"verification.":[39],"First,":[40],"nonparametric":[41],"feature":[42],"analysis":[43],"(NFA)":[44],"is":[45,73],"employed":[46],"to":[47,75,118],"suppress":[48],"intra-speaker":[49],"variation":[50],"and":[51,87,111,120,151],"emphasize":[52],"discriminative":[54],"information":[55,79,82],"inherited":[56],"in":[57,62,67,95],"boundaries":[59],"between":[60],"speakers":[61],"i-vector":[64,94],"space.":[65],"Then,":[66],"NFA-projected":[69],"subspace,":[70],"applied":[74],"separate":[76],"SNR-specific":[78],"from":[80],"speaker-specific":[81],"using":[83],"identity":[85],"factor":[86],"SNR":[89,119],"factor.":[90],"Accordingly,":[91],"a":[92,103],"projected":[93],"NFA":[97],"subspace":[98],"can":[99],"be":[100],"represented":[101],"as":[102],"linear":[104],"combination":[105],"three":[107],"components:":[108],"speaker,":[109],"SNR,":[110],"channel.":[112],"During":[113],"verification,":[114],"due":[117],"channels":[121],"are":[122],"integrated":[123],"out":[124],"when":[125,145],"computing":[126],"marginal":[128],"likelihood":[129],"ratio.":[130],"Experiments":[131],"based":[132],"on":[133],"NIST":[134],"2012":[135],"SRE":[136],"show":[137],"that":[138],"proposed":[140],"achieves":[142],"superior":[143],"compared":[146],"with":[147],"conventional":[149],"SNR-dependent":[152],"mixture":[153],"PLDA.":[155]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":9},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
