{"id":"https://openalex.org/W3160973314","doi":"https://doi.org/10.1109/icassp39728.2021.9413967","title":"Densely Connected Multi-Stage Model with Channel Wise Subband Feature for Real-Time Speech Enhancement","display_name":"Densely Connected Multi-Stage Model with Channel Wise Subband Feature for Real-Time Speech Enhancement","publication_year":2021,"publication_date":"2021-05-13","ids":{"openalex":"https://openalex.org/W3160973314","doi":"https://doi.org/10.1109/icassp39728.2021.9413967","mag":"3160973314"},"language":"en","primary_location":{"id":"doi:10.1109/icassp39728.2021.9413967","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp39728.2021.9413967","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100642253","display_name":"Jingdong Li","orcid":"https://orcid.org/0000-0003-2335-6280"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingdong Li","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101954584","display_name":"Dawei Luo","orcid":"https://orcid.org/0009-0000-1875-0262"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dawei Luo","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100657451","display_name":"Yun Liu","orcid":"https://orcid.org/0000-0002-2861-0316"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Liu","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101860834","display_name":"Yuanyuan Zhu","orcid":"https://orcid.org/0000-0002-3422-8017"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanyuan Zhu","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100380854","display_name":"Zhaoxia Li","orcid":"https://orcid.org/0000-0002-8045-6176"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaoxia Li","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064776161","display_name":"Guohui Cui","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guohui Cui","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101954684","display_name":"Wenqi Tang","orcid":"https://orcid.org/0000-0002-0379-7081"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenqi Tang","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100344582","display_name":"Wei Chen","orcid":"https://orcid.org/0000-0003-3720-718X"},"institutions":[{"id":"https://openalex.org/I4210134178","display_name":"Sohu (China)","ror":"https://ror.org/02sfdh709","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210134178"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Chen","raw_affiliation_strings":["AI Interaction Division, Sogou Inc, Beijing, China"],"affiliations":[{"raw_affiliation_string":"AI Interaction Division, Sogou Inc, Beijing, China","institution_ids":["https://openalex.org/I4210134178"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100642253"],"corresponding_institution_ids":["https://openalex.org/I4210134178"],"apc_list":null,"apc_paid":null,"fwci":1.676,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.84144692,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"6638","last_page":"6642"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8310893774032593},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.7670527696609497},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7352484464645386},{"id":"https://openalex.org/keywords/mean-opinion-score","display_name":"Mean opinion score","score":0.6433196663856506},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.612017810344696},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5566674470901489},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.45097655057907104},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40203580260276794}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8310893774032593},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.7670527696609497},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7352484464645386},{"id":"https://openalex.org/C62897895","wikidata":"https://www.wikidata.org/wiki/Q1915482","display_name":"Mean opinion score","level":3,"score":0.6433196663856506},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.612017810344696},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5566674470901489},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.45097655057907104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40203580260276794},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp39728.2021.9413967","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp39728.2021.9413967","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1482149378","https://openalex.org/W2044893557","https://openalex.org/W2117678320","https://openalex.org/W2291877678","https://openalex.org/W2603567530","https://openalex.org/W2889442120","https://openalex.org/W2891433113","https://openalex.org/W2894785362","https://openalex.org/W2940275453","https://openalex.org/W2952218014","https://openalex.org/W2962866211","https://openalex.org/W2963045393","https://openalex.org/W2963103134","https://openalex.org/W2963727650","https://openalex.org/W2991361823","https://openalex.org/W2998657200","https://openalex.org/W3084645150","https://openalex.org/W3094893721","https://openalex.org/W3096408984","https://openalex.org/W3099330747","https://openalex.org/W3163464523"],"related_works":["https://openalex.org/W1600259599","https://openalex.org/W2770593030","https://openalex.org/W4281727072","https://openalex.org/W4312219546","https://openalex.org/W2013629269","https://openalex.org/W2139455842","https://openalex.org/W4287113595","https://openalex.org/W3176271478","https://openalex.org/W3162422176","https://openalex.org/W2059407125"],"abstract_inverted_index":{"Research":[0],"on":[1],"single":[2],"channel":[3],"speech":[4,65,82,153],"enhancement":[5,25,38,66],"(SE)":[6],"has":[7],"a":[8,61,141],"long":[9],"tradition,":[10],"but":[11],"two":[12],"main":[13],"practical":[14],"problems":[15],"still":[16],"remain":[17],"unsolved.":[18],"Firstly,":[19],"it\u2019s":[20],"hard":[21],"to":[22,88,97,100,107,113,166],"balance":[23],"between":[24],"quality":[26,154],"and":[27,30,45,116,155],"computational":[28],"efficiency,":[29],"low-latency":[31],"always":[32],"brings":[33],"loss":[34],"of":[35,53,92,130,152,196],"quality.":[36],"Secondly,":[37],"in":[39,95,111,150,158,194],"specific":[40,131],"scenarios,":[41,132],"such":[42],"as":[43],"singing":[44],"emotional":[46],"speech,":[47],"is":[48,86,105,124],"also":[49],"an":[50,120],"intricate":[51],"problem":[52],"conventional":[54],"methods.":[55],"In":[56,182],"this":[57],"paper,":[58],"we":[59],"propose":[60],"computationally":[62],"efficient":[63],"real-time":[64,174],"network":[67],"with":[68,126],"densely":[69],"connected":[70],"multi-stage":[71],"structures,":[72],"which":[73,133,177],"progressively":[74],"enhances":[75],"the":[76,90,143,163,167,183],"channel-wise":[77],"subband":[78],"speech.":[79],"The":[80],"enhanced":[81],"from":[83],"earlier":[84],"stage":[85,94],"used":[87],"guide":[89],"processing":[91],"deeper":[93],"order":[96,112],"obtain":[98],"coarse":[99],"fine":[101],"estimations.":[102],"Besides,":[103],"supervision":[104],"applied":[106],"all":[108],"intermediate":[109],"results":[110],"stabilize":[114],"training":[115],"accelerate":[117],"convergence.":[118],"Moreover,":[119],"adaptive":[121],"fine-tune":[122],"step":[123],"utilized":[125],"some":[127],"small":[128],"datasets":[129],"achieves":[134,146],"superb":[135],"improvement":[136],"under":[137],"corresponding":[138],"scenes.":[139],"As":[140],"result,":[142],"proposed":[144,164],"method":[145,165],"promising":[147],"performance":[148],"improvements":[149],"terms":[151,195],"demonstrates":[156],"robustness":[157],"complex":[159],"scenarios.":[160],"We":[161],"submitt":[162],"deep":[168],"noise":[169],"suppression":[170],"(DNS)":[171],"challenge":[172],"2021,":[173],"denoising":[175],"track,":[176],"was":[178],"held":[179],"by":[180,191],"Microsoft.":[181],"subjective":[184],"evaluation,":[185],"our":[186],"system":[187],"outperforms":[188],"DNS-Challenge":[189],"baseline":[190],"0.14":[192],"points":[193],"mean":[197],"opinion":[198],"score":[199],"(MOS).":[200]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
