{"id":"https://openalex.org/W3138670565","doi":"https://doi.org/10.1109/taslp.2021.3067154","title":"TAU-Net: Temporal Activation U-Net Shared With Nonnegative Matrix Factorization for Speech Enhancement in Unseen Noise Environments","display_name":"TAU-Net: Temporal Activation U-Net Shared With Nonnegative Matrix Factorization for Speech Enhancement in Unseen Noise Environments","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3138670565","doi":"https://doi.org/10.1109/taslp.2021.3067154","mag":"3138670565"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2021.3067154","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3067154","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041277364","display_name":"Kwang Myung Jeon","orcid":"https://orcid.org/0000-0003-2810-3063"},"institutions":[{"id":"https://openalex.org/I4210120602","display_name":"Advanced Institute of Convergence Technology","ror":"https://ror.org/01w62yz22","country_code":"KR","type":"facility","lineage":["https://openalex.org/I139264467","https://openalex.org/I4210120602"]},{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Kwang Myung Jeon","raw_affiliation_strings":["AI Convergence Technology Laboratory, Intflow Inc., Gwangju, Korea","Gwangju Institute of Science and Technology, Gwangju, Korea"],"affiliations":[{"raw_affiliation_string":"AI Convergence Technology Laboratory, Intflow Inc., Gwangju, Korea","institution_ids":["https://openalex.org/I4210120602"]},{"raw_affiliation_string":"Gwangju Institute of Science and Technology, Gwangju, Korea","institution_ids":["https://openalex.org/I39534123"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028537246","display_name":"Geon Woo Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Geon Woo Lee","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology (GIST), Gwangju, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology (GIST), Gwangju, Korea","institution_ids":["https://openalex.org/I39534123"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067154795","display_name":"Nam Kyun Kim","orcid":"https://orcid.org/0000-0001-6923-230X"},"institutions":[{"id":"https://openalex.org/I4210095514","display_name":"Korea Automotive Technology Institute","ror":"https://ror.org/00sc3t321","country_code":"KR","type":"facility","lineage":["https://openalex.org/I4210095514"]},{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Nam Kyun Kim","raw_affiliation_strings":["Gwangju Institute of Science and Technology (GIST)., Automotive Electronics R&D Center, Korea Automotive Technology Institute (KATECH), Gwangju, Korea"],"affiliations":[{"raw_affiliation_string":"Gwangju Institute of Science and Technology (GIST)., Automotive Electronics R&D Center, Korea Automotive Technology Institute (KATECH), Gwangju, Korea","institution_ids":["https://openalex.org/I4210095514","https://openalex.org/I39534123"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085604883","display_name":"Hong Kook Kim","orcid":"https://orcid.org/0000-0002-0105-6693"},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hong Kook Kim","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology (GIST), Gwangju, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology (GIST), Gwangju, Korea","institution_ids":["https://openalex.org/I39534123"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5041277364"],"corresponding_institution_ids":["https://openalex.org/I39534123","https://openalex.org/I4210120602"],"apc_list":null,"apc_paid":null,"fwci":0.9142,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.72988506,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"29","issue":null,"first_page":"3400","last_page":"3414"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.865562915802002},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7437082529067993},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5829603672027588},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.49703267216682434},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.48421549797058105},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4809214770793915},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.480183482170105},{"id":"https://openalex.org/keywords/net","display_name":"Net (polyhedron)","score":0.47883203625679016},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.4666191637516022},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.42843982577323914},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3688962459564209},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.23778969049453735},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1604577600955963},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.1456322968006134}],"concepts":[{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.865562915802002},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7437082529067993},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5829603672027588},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.49703267216682434},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.48421549797058105},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4809214770793915},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.480183482170105},{"id":"https://openalex.org/C14166107","wikidata":"https://www.wikidata.org/wiki/Q253829","display_name":"Net (polyhedron)","level":2,"score":0.47883203625679016},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.4666191637516022},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.42843982577323914},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3688962459564209},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.23778969049453735},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1604577600955963},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.1456322968006134},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2021.3067154","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3067154","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7699999809265137}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1569068623","https://openalex.org/W1635512741","https://openalex.org/W1790748249","https://openalex.org/W1901129140","https://openalex.org/W1974387177","https://openalex.org/W1983108229","https://openalex.org/W1987097504","https://openalex.org/W1997528538","https://openalex.org/W2013608223","https://openalex.org/W2044893557","https://openalex.org/W2077799289","https://openalex.org/W2078528584","https://openalex.org/W2094721231","https://openalex.org/W2096698681","https://openalex.org/W2111854888","https://openalex.org/W2118718620","https://openalex.org/W2127851351","https://openalex.org/W2134973740","https://openalex.org/W2156448167","https://openalex.org/W2158291955","https://openalex.org/W2168379380","https://openalex.org/W2402901296","https://openalex.org/W2402962867","https://openalex.org/W2405589348","https://openalex.org/W2405774341","https://openalex.org/W2508062474","https://openalex.org/W2513910579","https://openalex.org/W2519994964","https://openalex.org/W2559246505","https://openalex.org/W2559809918","https://openalex.org/W2603567530","https://openalex.org/W2622005144","https://openalex.org/W2661910912","https://openalex.org/W2746457594","https://openalex.org/W2748471249","https://openalex.org/W2760027020","https://openalex.org/W2766672686","https://openalex.org/W2774707525","https://openalex.org/W2791686384","https://openalex.org/W2810535283","https://openalex.org/W2889205417","https://openalex.org/W2937484199","https://openalex.org/W2943554574","https://openalex.org/W2952218014","https://openalex.org/W2962701080","https://openalex.org/W2963103134","https://openalex.org/W2963341071","https://openalex.org/W2963453742","https://openalex.org/W2964121744","https://openalex.org/W2994244075","https://openalex.org/W3099330747","https://openalex.org/W4298642009","https://openalex.org/W6631190155","https://openalex.org/W6637992904","https://openalex.org/W6639824700","https://openalex.org/W6677759377","https://openalex.org/W6713779898","https://openalex.org/W6744787216","https://openalex.org/W6746914816","https://openalex.org/W6844105982"],"related_works":["https://openalex.org/W2127243424","https://openalex.org/W2037504162","https://openalex.org/W2792706544","https://openalex.org/W1568451138","https://openalex.org/W2539013788","https://openalex.org/W2156699640","https://openalex.org/W2045265907","https://openalex.org/W3006480059","https://openalex.org/W2972997031","https://openalex.org/W2900450731"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"a":[3,10,63,67,163],"novel":[4],"speech":[5,81,131,148],"enhancement":[6,149,187],"method":[7,26,86,150,161],"based":[8],"on":[9],"hybrid":[11],"machine-learning":[12],"architecture":[13],"consisting":[14],"of":[15,31,95,127,144,170,181],"U-Net":[16,41,65],"and":[17,42,82,173,192],"nonnegative":[18],"matrix":[19],"factorization":[20],"(NMF)":[21],"is":[22,72,132,151],"proposed.":[23],"The":[24,84,142],"proposed":[25,85,97,146,160],"attempts":[27],"to":[28,45,112,117,138],"take":[29],"advantage":[30],"both":[32],"the":[33,43,59,89,93,96,107,124,139,145,159,182],"accurate":[34],"separation":[35],"for":[36],"known":[37],"noise":[38,156],"environments":[39],"by":[40,48,134],"adaptation":[44],"unseen":[46,118,155],"noises":[47,119],"an":[49,52,100],"NMF":[50,76,101],"with":[51,66,75,102,166],"online":[53,103],"dictionary":[54,104],"learning":[55,105],"technique.":[56],"To":[57],"merge":[58],"two":[60],"different":[61],"architectures,":[62],"modified":[64],"temporal":[68,90,110,136],"activation":[69],"layer":[70],"(TAU-Net)":[71],"jointly":[73],"optimized":[74],"models":[77],"that":[78,120],"represent":[79],"universal":[80],"noise.":[83],"first":[87],"estimates":[88],"activations":[91,111,137],"from":[92],"encoder":[94],"TAU-Net.":[98,128],"Then,":[99],"adjusts":[106],"initially":[108],"given":[109],"suppress":[113],"their":[114],"cross-activations":[115],"due":[116],"are":[121,177],"unknown":[122],"in":[123,153],"training":[125],"phase":[126],"Finally,":[129],"clean":[130],"obtained":[133],"adjusting":[135],"TAU-Net":[140],"decoder.":[141],"effectiveness":[143],"TAU-Net-based":[147],"evaluated":[152],"various":[154],"environments.":[157],"Consequently,":[158],"achieves":[162],"substantial":[164],"improvement":[165],"average":[167],"signal-to-distortion":[168],"ratios":[169],"2.32":[171],"dB":[172],"5.68":[174],"dB,":[175],"which":[176],"higher":[178],"than":[179],"those":[180],"baseline":[183],"methods":[184],"such":[185],"asspeech":[186],"generative":[188],"adversarial":[189],"network":[190],"(SEGAN)":[191],"U-Net,":[193],"respectively.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
