{"id":"https://openalex.org/W4382536354","doi":"https://doi.org/10.1109/lsp.2023.3290832","title":"A Fused Speech Enhancement Framework for Robust Speaker Verification","display_name":"A Fused Speech Enhancement Framework for Robust Speaker Verification","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4382536354","doi":"https://doi.org/10.1109/lsp.2023.3290832"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2023.3290832","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3290832","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049638215","display_name":"Yanfeng Wu","orcid":"https://orcid.org/0000-0002-1498-9177"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanfeng Wu","raw_affiliation_strings":["College of Artificial Intelligence, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021697903","display_name":"Taihao Li","orcid":"https://orcid.org/0000-0003-3279-7125"},"institutions":[{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Taihao Li","raw_affiliation_strings":["Department of Artificial Intelligence, Zhejiang Lab, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence, Zhejiang Lab, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012579399","display_name":"Junan Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junan Zhao","raw_affiliation_strings":["College of Artificial Intelligence, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101729503","display_name":"Qirui Wang","orcid":"https://orcid.org/0000-0003-3653-2984"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qirui Wang","raw_affiliation_strings":["College of Artificial Intelligence, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042066408","display_name":"Jing Xu","orcid":"https://orcid.org/0000-0001-8532-2241"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Xu","raw_affiliation_strings":["College of Artificial Intelligence, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5049638215"],"corresponding_institution_ids":["https://openalex.org/I205237279"],"apc_list":null,"apc_paid":null,"fwci":1.222,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.8294214,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"30","issue":null,"first_page":"883","last_page":"887"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8062237501144409},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7829335927963257},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.6189500093460083},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.6028500199317932},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5878396034240723},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5352523922920227},{"id":"https://openalex.org/keywords/noise-measurement","display_name":"Noise measurement","score":0.5195763111114502},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.517922580242157},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4777921140193939},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.4554426968097687},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4510400593280792},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.4349093735218048},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4254087209701538},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.42382875084877014},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.4146490693092346},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06351152062416077}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8062237501144409},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7829335927963257},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.6189500093460083},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.6028500199317932},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5878396034240723},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5352523922920227},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.5195763111114502},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.517922580242157},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4777921140193939},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.4554426968097687},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4510400593280792},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.4349093735218048},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4254087209701538},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.42382875084877014},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.4146490693092346},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06351152062416077},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C103038307","wikidata":"https://www.wikidata.org/wiki/Q6556360","display_name":"Lipid bilayer fusion","level":3,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2023.3290832","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3290832","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.4000000059604645}],"awards":[{"id":"https://openalex.org/G3830000997","display_name":null,"funder_award_id":"21JCYBJC00110","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"},{"id":"https://openalex.org/G8225404974","display_name":null,"funder_award_id":"62002177","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8559640209","display_name":null,"funder_award_id":"19JCQNJC00300","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323993","display_name":"Natural Science Foundation of Tianjin City","ror":null},{"id":"https://openalex.org/F4320329860","display_name":"National Science and Technology Major Project","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2194775991","https://openalex.org/W2219249508","https://openalex.org/W2311973309","https://openalex.org/W2605589342","https://openalex.org/W2696967604","https://openalex.org/W2718701456","https://openalex.org/W2726515241","https://openalex.org/W2746457594","https://openalex.org/W2784163702","https://openalex.org/W2890964092","https://openalex.org/W2916104401","https://openalex.org/W2922509574","https://openalex.org/W2937813194","https://openalex.org/W2962866211","https://openalex.org/W2962914040","https://openalex.org/W2963127163","https://openalex.org/W2972425344","https://openalex.org/W2972443522","https://openalex.org/W2982037672","https://openalex.org/W3013020904","https://openalex.org/W3015598461","https://openalex.org/W3024301174","https://openalex.org/W3024869864","https://openalex.org/W3025783616","https://openalex.org/W3088315586","https://openalex.org/W3091570562","https://openalex.org/W3096964161","https://openalex.org/W3103152812","https://openalex.org/W3137249133","https://openalex.org/W3141035251","https://openalex.org/W3174649707","https://openalex.org/W3196650842","https://openalex.org/W3197013563","https://openalex.org/W3198742213","https://openalex.org/W4221154746","https://openalex.org/W4225682608","https://openalex.org/W4288091954","https://openalex.org/W6631190155","https://openalex.org/W6688816777","https://openalex.org/W6739720703","https://openalex.org/W6769178842"],"related_works":["https://openalex.org/W4375869276","https://openalex.org/W4221152531","https://openalex.org/W2401410855","https://openalex.org/W2970290810","https://openalex.org/W2046186789","https://openalex.org/W2355125052","https://openalex.org/W2076268407","https://openalex.org/W2810291168","https://openalex.org/W2116686031","https://openalex.org/W2744059046"],"abstract_inverted_index":{"Robust":[0],"speaker":[1,138],"verification":[2],"(RSV)":[3],"under":[4],"noisy":[5],"con-":[6],"ditions":[7],"is":[8],"still":[9],"a":[10,60,109],"challenging":[11],"task.":[12,54],"Recently,":[13],"some":[14],"task-specific":[15],"speech":[16],"enhancement":[17],"(SE)":[18],"approaches":[19],"are":[20,91],"proposed":[21],"and":[22,39,72,82,102,130,142,156],"achieve":[23],"excellent":[24],"performance":[25,50,162],"on":[26,94,147],"RSV.":[27],"However,":[28],"all":[29],"these":[30],"works":[31],"adopt":[32],"only":[33,128],"one":[34],"kind":[35],"of":[36,51,97,163],"SE":[37,62,76],"network":[38],"thus":[40],"can":[41,126,159],"not":[42,127],"remove":[43],"noise":[44,141],"from":[45],"different":[46],"aspects,":[47],"limiting":[48],"the":[49,52,84,118,122,148,154,157,161],"RSV":[53,164],"In":[55,105],"this":[56],"letter,":[57],"we":[58,107],"propose":[59],"fused":[61],"framework":[63],"(FSEF)":[64],"for":[65],"RSV,":[66],"which":[67],"integrates":[68],"both":[69,153],"T-F":[70],"masking-based":[71],"feature":[73,103],"mapping-":[74],"based":[75,93],"networks":[77],"to":[78,166],"collect":[79],"complementary":[80],"information":[81],"improve":[83,160],"robustness":[85],"against":[86,140],"noise.":[87],"Two":[88],"FESF-RSV":[89],"systems":[90],"constructed":[92],"two":[95],"kinds":[96],"fusion":[98,101],"methods:":[99],"score":[100],"fusion.":[104],"addition,":[106],"present":[108],"Multi-":[110],"Scale":[111],"Attentive":[112],"Context":[113],"Aggregation":[114],"Network":[115],"(MSACAN)":[116],"as":[117],"backbone":[119],"structure":[120],"in":[121],"FSEF.":[123],"The":[124],"MSACAN":[125,158],"extract":[129],"fuse":[131],"multi-scale":[132],"features":[133],"adaptively":[134],"but":[135],"also":[136],"enhance":[137],"characteristics":[139],"interfering":[143],"speakers.":[144],"Experiments":[145],"conducted":[146],"noise-simulated":[149],"VoxCeleb1":[150],"dataset":[151],"demonstrate":[152],"FSEF":[155],"compared":[165],"previous":[167],"approaches.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
