{"id":"https://openalex.org/W4408355634","doi":"https://doi.org/10.1109/icassp49660.2025.10889525","title":"Mamba-SEUNet: Mamba UNet for Monaural Speech Enhancement","display_name":"Mamba-SEUNet: Mamba UNet for Monaural Speech Enhancement","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408355634","doi":"https://doi.org/10.1109/icassp49660.2025.10889525"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10889525","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889525","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100612117","display_name":"Junyu Wang","orcid":"https://orcid.org/0000-0001-5096-9598"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junyu Wang","raw_affiliation_strings":["Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zizhen Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zizhen Lin","raw_affiliation_strings":["Sichuan University,School of Electronic Information,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sichuan University,School of Electronic Information,China","institution_ids":["https://openalex.org/I24185976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106558173","display_name":"Tianrui Wang","orcid":"https://orcid.org/0000-0002-2765-5889"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianrui Wang","raw_affiliation_strings":["Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103107663","display_name":"Meng Ge","orcid":"https://orcid.org/0000-0003-4251-0482"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Ge","raw_affiliation_strings":["Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050763764","display_name":"Longbiao Wang","orcid":"https://orcid.org/0000-0002-4005-5036"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longbiao Wang","raw_affiliation_strings":["Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin University,Laboratory of Cognitive Computing and Application, College of Intelligence and Computing,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017251198","display_name":"Jianwu Dang","orcid":"https://orcid.org/0000-0002-9237-4821"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianwu Dang","raw_affiliation_strings":["Chinese Academy of Sciences,Shenzhen Institute of Advanced Technology,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Shenzhen Institute of Advanced Technology,China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100612117"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":9.4697,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.98192526,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9502999782562256,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9077000021934509,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.669951319694519},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5245469212532043},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4371260106563568},{"id":"https://openalex.org/keywords/audiology","display_name":"Audiology","score":0.35762691497802734},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.09225967526435852}],"concepts":[{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.669951319694519},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5245469212532043},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4371260106563568},{"id":"https://openalex.org/C548259974","wikidata":"https://www.wikidata.org/wiki/Q569965","display_name":"Audiology","level":1,"score":0.35762691497802734},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.09225967526435852}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10889525","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889525","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W1901129140","https://openalex.org/W2094721231","https://openalex.org/W2141998673","https://openalex.org/W2603567530","https://openalex.org/W2921144622","https://openalex.org/W2950635152","https://openalex.org/W2952218014","https://openalex.org/W2963446712","https://openalex.org/W3015197852","https://openalex.org/W3097945073","https://openalex.org/W3158779859","https://openalex.org/W3161950572","https://openalex.org/W3197912330","https://openalex.org/W3206809722","https://openalex.org/W4221143458","https://openalex.org/W4225298533","https://openalex.org/W4225309689","https://openalex.org/W4232282348","https://openalex.org/W4296068416","https://openalex.org/W4296069347","https://openalex.org/W4296070381","https://openalex.org/W4385807442","https://openalex.org/W4385822368","https://openalex.org/W4385822478","https://openalex.org/W4385823378","https://openalex.org/W4390872931","https://openalex.org/W4402112274","https://openalex.org/W4402112631","https://openalex.org/W4406461266","https://openalex.org/W6696884364","https://openalex.org/W6739901393","https://openalex.org/W6757817989","https://openalex.org/W6767440493","https://openalex.org/W6803444062","https://openalex.org/W6859298233","https://openalex.org/W6861387779","https://openalex.org/W6862087182","https://openalex.org/W6863679278","https://openalex.org/W6869952813"],"related_works":["https://openalex.org/W193150574","https://openalex.org/W9415986","https://openalex.org/W1987460062","https://openalex.org/W34801070","https://openalex.org/W1967392028","https://openalex.org/W2129538847","https://openalex.org/W2164958657","https://openalex.org/W4200066910","https://openalex.org/W2393220202","https://openalex.org/W2075894011"],"abstract_inverted_index":{"In":[0,62],"recent":[1],"speech":[2,90],"enhancement":[3],"(SE)":[4],"research,":[5],"transformer":[6],"and":[7,45,57,86,95],"its":[8,50],"variants":[9],"have":[10],"emerged":[11],"as":[12,31],"the":[13,17,21,112,132,140],"predominant":[14],"methodologies.":[15],"However,":[16],"quadratic":[18],"complexity":[19],"of":[20,89,122],"self-attention":[22],"mechanism":[23],"imposes":[24],"certain":[25],"limitations":[26],"on":[27,111],"practical":[28],"deployment.":[29],"Mamba,":[30],"a":[32,119],"novel":[33],"state-space":[34],"model":[35,84],"(SSM),":[36],"has":[37],"gained":[38],"widespread":[39],"application":[40],"in":[41,53],"natural":[42],"language":[43],"processing":[44],"computer":[46],"vision":[47],"due":[48],"to":[49,83,99,143],"strong":[51],"capabilities":[52],"modeling":[54],"long":[55],"sequences":[56],"relatively":[58],"low":[59,126],"computational":[60,127],"complexity.":[61,128],"this":[63],"work,":[64],"we":[65],"introduce":[66],"Mamba-SEUNet,":[67],"an":[68],"innovative":[69],"architecture":[70],"that":[71,116],"integrates":[72],"Mamba":[73,82],"with":[74,131],"U-Net":[75],"for":[76],"SE":[77],"tasks.":[78],"By":[79],"leveraging":[80],"bidirectional":[81],"forward":[85],"backward":[87],"dependencies":[88],"signals":[91],"at":[92],"different":[93],"resolutions,":[94],"incorporating":[96],"skip":[97],"connections":[98],"capture":[100],"multi-scale":[101],"information,":[102],"our":[103],"approach":[104],"achieves":[105],"state-of-the-art":[106],"(SOTA)":[107],"performance.":[108],"Experimental":[109],"results":[110],"VCTK+DEMAND":[113],"dataset":[114],"indicate":[115],"Mamba-SEUNet":[117,137],"attains":[118],"PESQ":[120,141],"score":[121,142],"3.59,":[123],"while":[124],"maintaining":[125],"When":[129],"combined":[130],"Perceptual":[133],"Contrast":[134],"Stretching":[135],"technique,":[136],"further":[138],"improves":[139],"3.73.":[144]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":3}],"updated_date":"2026-05-14T08:36:36.166977","created_date":"2025-10-10T00:00:00"}
