{"id":"https://openalex.org/W4389633906","doi":"https://doi.org/10.1109/access.2023.3341919","title":"Phase-Aware Speech Enhancement With Complex Wiener Filter","display_name":"Phase-Aware Speech Enhancement With Complex Wiener Filter","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4389633906","doi":"https://doi.org/10.1109/access.2023.3341919"},"language":"en","primary_location":{"id":"doi:10.1109/access.2023.3341919","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3341919","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10354333.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10354333.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101841313","display_name":"Huy Toan Nguyen","orcid":"https://orcid.org/0009-0008-6274-735X"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Huy Nguyen","raw_affiliation_strings":["Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Ishikawa, Nomi, Japan","Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Ishikawa, Nomi, Japan","institution_ids":["https://openalex.org/I177738480"]},{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083304186","display_name":"Tuan Vu Ho","orcid":"https://orcid.org/0000-0001-6819-0443"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]},{"id":"https://openalex.org/I4210153682","display_name":"Intelligent Health (United Kingdom)","ror":"https://ror.org/0576zak10","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210153682"]}],"countries":["GB","JP"],"is_corresponding":false,"raw_author_name":"Tuan Vu Ho","raw_affiliation_strings":["Media Intelligent Processing Reseach Department, Advanced Artificial Intelligent Innovation Center, Hitachi Ltd, Tokyo, Japan","Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan"],"affiliations":[{"raw_affiliation_string":"Media Intelligent Processing Reseach Department, Advanced Artificial Intelligent Innovation Center, Hitachi Ltd, Tokyo, Japan","institution_ids":["https://openalex.org/I4210153682"]},{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055059119","display_name":"Masato Akagi","orcid":"https://orcid.org/0000-0003-2450-6754"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masato Akagi","raw_affiliation_strings":["Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Ishikawa, Nomi, Japan","Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Ishikawa, Nomi, Japan","institution_ids":["https://openalex.org/I177738480"]},{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014199725","display_name":"Masashi Unoki","orcid":"https://orcid.org/0000-0002-6605-2052"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masashi Unoki","raw_affiliation_strings":["Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Ishikawa, Nomi, Japan","Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Ishikawa, Nomi, Japan","institution_ids":["https://openalex.org/I177738480"]},{"raw_affiliation_string":"Graduate School of Advanced Science and Technology, Japan Advanced Institute of Science and Technology (JAIST), Nomi, Ishikawa, Japan","institution_ids":["https://openalex.org/I177738480"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101841313"],"corresponding_institution_ids":["https://openalex.org/I177738480"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.3927,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.59461967,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"11","issue":null,"first_page":"141573","last_page":"141584"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.8166508674621582},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7331967353820801},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6048133969306946},{"id":"https://openalex.org/keywords/intelligibility","display_name":"Intelligibility (philosophy)","score":0.5505275726318359},{"id":"https://openalex.org/keywords/wiener-filter","display_name":"Wiener filter","score":0.49707868695259094},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.4597087502479553},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.43820685148239136},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40467241406440735},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38606521487236023},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.29645708203315735},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.20355471968650818}],"concepts":[{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.8166508674621582},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7331967353820801},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6048133969306946},{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.5505275726318359},{"id":"https://openalex.org/C18537770","wikidata":"https://www.wikidata.org/wiki/Q25523","display_name":"Wiener filter","level":2,"score":0.49707868695259094},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.4597087502479553},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.43820685148239136},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40467241406440735},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38606521487236023},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.29645708203315735},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.20355471968650818},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2023.3341919","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3341919","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10354333.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:eaaa6b59af1947aa8efd515f9e552272","is_oa":true,"landing_page_url":"https://doaj.org/article/eaaa6b59af1947aa8efd515f9e552272","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 11, Pp 141573-141584 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2023.3341919","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3341919","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10354333.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5600000023841858}],"awards":[{"id":"https://openalex.org/G3635912132","display_name":null,"funder_award_id":"20KK0233","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7223476060","display_name":null,"funder_award_id":"21H03463","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4389633906.pdf","grobid_xml":"https://content.openalex.org/works/W4389633906.grobid-xml"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W160800111","https://openalex.org/W190004713","https://openalex.org/W1552314771","https://openalex.org/W2013590534","https://openalex.org/W2022554507","https://openalex.org/W2027840501","https://openalex.org/W2039844283","https://openalex.org/W2044893557","https://openalex.org/W2067295501","https://openalex.org/W2070126272","https://openalex.org/W2094721231","https://openalex.org/W2113131123","https://openalex.org/W2128653836","https://openalex.org/W2291877678","https://openalex.org/W2405774341","https://openalex.org/W2514828952","https://openalex.org/W2752796333","https://openalex.org/W2766672686","https://openalex.org/W2790760353","https://openalex.org/W2802304149","https://openalex.org/W2883322837","https://openalex.org/W2889597349","https://openalex.org/W2949756029","https://openalex.org/W2952218014","https://openalex.org/W2963341071","https://openalex.org/W2963452667","https://openalex.org/W3045520545","https://openalex.org/W3081955528","https://openalex.org/W3089425003","https://openalex.org/W3092864146","https://openalex.org/W3095057960","https://openalex.org/W3096408984","https://openalex.org/W3097312999","https://openalex.org/W3099330747","https://openalex.org/W3100270690","https://openalex.org/W3117879684","https://openalex.org/W3120336970","https://openalex.org/W3131332223","https://openalex.org/W3135915893","https://openalex.org/W3147539069","https://openalex.org/W3160085755","https://openalex.org/W3198680319","https://openalex.org/W3199367817","https://openalex.org/W4225298533","https://openalex.org/W4232282348","https://openalex.org/W4297841734","https://openalex.org/W6640963894","https://openalex.org/W6729448088","https://openalex.org/W6738884980","https://openalex.org/W6751512325","https://openalex.org/W6757632829","https://openalex.org/W6762114000","https://openalex.org/W6798721538"],"related_works":["https://openalex.org/W2106793170","https://openalex.org/W1577562165","https://openalex.org/W2028846388","https://openalex.org/W4295210860","https://openalex.org/W2072015625","https://openalex.org/W2117955483","https://openalex.org/W2161534637","https://openalex.org/W2029794884","https://openalex.org/W2010870899","https://openalex.org/W1986772939"],"abstract_inverted_index":{"In":[0],"speech":[1,9,13,61,75,154,187,228],"enhancement,":[2],"accurate":[3],"phase":[4,31,82,115],"reconstruction":[5],"can":[6],"significantly":[7],"improve":[8,129],"quality.":[10],"While":[11],"phase-aware":[12,60],"enhancement":[14,62,226],"methods":[15],"using":[16],"the":[17,26,30,35,41,47,72,81,88,91,95,119,124,148,161,201,209,220,232],"complex":[18,67],"ideal":[19],"ratio":[20,122],"mask":[21],"(cIRM)":[22],"have":[23],"shown":[24],"promise,":[25],"estimation":[27,73,105,207],"difficulty":[28],"of":[29,40,74,97,142,152,186,190,197],"is":[32,234],"shared":[33],"with":[34,90,107,176],"real":[36],"and":[37,76,80,93,113,192],"imaginary":[38,48],"parts":[39],"cIRM.":[42],"The":[43],"pattern":[44],"lacking":[45],"in":[46,123],"part":[49],"poses":[50],"particular":[51],"difficulties.":[52],"To":[53,127],"address":[54],"this":[55],"issue,":[56],"we":[57,132],"proposed":[58,221],"a":[59,66,103,108,114,134,139,183],"method":[63,101,159,181,203],"that":[64,117,137,218],"uses":[65,102,138],"Wiener":[68],"filter,":[69],"which":[70],"delegates":[71],"noise":[77],"amplitude":[78],"properties":[79],"property":[83],"to":[84,172],"different":[85],"models,":[86],"mitigating":[87],"issues":[89],"cIRM":[92,206],"improving":[94],"effectiveness":[96],"neural-network":[98],"training.":[99],"Our":[100,180,214],"speech-variance":[104,130],"model":[106],"noise-robust":[109],"vector-quantized":[110],"variational":[111],"autoencoder":[112],"corrector":[116],"maximizes":[118],"scale-invariant":[120],"signal-to-noise":[121],"time":[125],"domain.":[126],"further":[128],"estimation,":[131],"propose":[133],"loss":[135,222],"function":[136,223],"categorical":[140],"distribution":[141],"fundamental":[143],"frequency":[144],"(F0)":[145],"for":[146,224],"enhancing":[147],"spectral":[149],"fine":[150],"structure":[151],"estimated":[153],"variance.":[155],"We":[156],"evaluated":[157],"our":[158],"on":[160,205],"open":[162],"dataset":[163],"released":[164],"by":[165],"Valentini":[166],"<italic":[167],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[168],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">et":[169],"al</i>":[170],".":[171],"directly":[173],"compare":[174],"it":[175],"other":[177],"speech-enhancement":[178],"methods.":[179],"achieved":[182],"perceptual":[184],"evaluation":[185],"quality":[188],"score":[189,196],"2.86":[191],"short-time":[193],"objective":[194],"intelligibility":[195],"0.94,":[198],"better":[199],"than":[200],"state-of-the-art":[202],"based":[204],"during":[208],"2020":[210],"Deep":[211],"Noise":[212],"Challenge.":[213],"comprehensive":[215],"analysis":[216],"shows":[217],"incorporating":[219],"spectral-fine-structure":[225],"improves":[227],"quality,":[229],"especially":[230],"when":[231],"F0":[233],"low.":[235]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
