{"id":"https://openalex.org/W4319586580","doi":"https://doi.org/10.1109/iscslp57327.2022.10037937","title":"Optimizing Shoulder to Shoulder: A Coordinated Sub-Band Fusion Model for Full-Band Speech Enhancement","display_name":"Optimizing Shoulder to Shoulder: A Coordinated Sub-Band Fusion Model for Full-Band Speech Enhancement","publication_year":2022,"publication_date":"2022-12-11","ids":{"openalex":"https://openalex.org/W4319586580","doi":"https://doi.org/10.1109/iscslp57327.2022.10037937"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp57327.2022.10037937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp57327.2022.10037937","pdf_url":null,"source":{"id":"https://openalex.org/S4363607181","display_name":"2022 13th International Symposium on Chinese Spoken Language Processing (ISCSLP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 13th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025635655","display_name":"Guochen Yu","orcid":"https://orcid.org/0000-0002-7179-1044"},"institutions":[{"id":"https://openalex.org/I4391768176","display_name":"State Key Laboratory of Media Convergence and Communication","ror":"https://ror.org/0595ys057","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391768176","https://openalex.org/I75689368"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guochen Yu","raw_affiliation_strings":["Communication University of China,State Key Laboratory of Media Convergence and Communication,Beijing,China","Chinese Academy of Sciences, Institute of Acoustics, Beijing, China","State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Communication University of China,State Key Laboratory of Media Convergence and Communication,Beijing,China","institution_ids":["https://openalex.org/I75689368","https://openalex.org/I4391768176"]},{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Acoustics, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053757616","display_name":"Andong Li","orcid":"https://orcid.org/0000-0003-4094-8448"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Andong Li","raw_affiliation_strings":["Institute of Acoustics,Chinese Academy of Sciences,Beijing,China","Chinese Academy of Sciences, Institute of Acoustics, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics,Chinese Academy of Sciences,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Acoustics, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100679522","display_name":"Wenzhe Liu","orcid":"https://orcid.org/0000-0002-0827-6883"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenzhe Liu","raw_affiliation_strings":["Institute of Acoustics,Chinese Academy of Sciences,Beijing,China","Chinese Academy of Sciences, Institute of Acoustics, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics,Chinese Academy of Sciences,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Acoustics, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070266277","display_name":"Chengshi Zheng","orcid":"https://orcid.org/0000-0001-5656-994X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengshi Zheng","raw_affiliation_strings":["Institute of Acoustics,Chinese Academy of Sciences,Beijing,China","Chinese Academy of Sciences, Institute of Acoustics, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics,Chinese Academy of Sciences,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Acoustics, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100741276","display_name":"Yutian Wang","orcid":"https://orcid.org/0009-0008-8451-600X"},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]},{"id":"https://openalex.org/I4391768176","display_name":"State Key Laboratory of Media Convergence and Communication","ror":"https://ror.org/0595ys057","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391768176","https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutian Wang","raw_affiliation_strings":["Communication University of China,State Key Laboratory of Media Convergence and Communication,Beijing,China","State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Communication University of China,State Key Laboratory of Media Convergence and Communication,Beijing,China","institution_ids":["https://openalex.org/I75689368","https://openalex.org/I4391768176"]},{"raw_affiliation_string":"State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100460841","display_name":"Hui Wang","orcid":"https://orcid.org/0000-0002-8476-888X"},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]},{"id":"https://openalex.org/I4391768176","display_name":"State Key Laboratory of Media Convergence and Communication","ror":"https://ror.org/0595ys057","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391768176","https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Wang","raw_affiliation_strings":["Communication University of China,State Key Laboratory of Media Convergence and Communication,Beijing,China","State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Communication University of China,State Key Laboratory of Media Convergence and Communication,Beijing,China","institution_ids":["https://openalex.org/I75689368","https://openalex.org/I4391768176"]},{"raw_affiliation_string":"State Key Laboratory of Media Convergence and Communication, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5025635655"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210099069","https://openalex.org/I4391768176","https://openalex.org/I75689368"],"apc_list":null,"apc_paid":null,"fwci":0.7355,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.71690363,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"483","last_page":"487"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7816532254219055},{"id":"https://openalex.org/keywords/out-of-band-management","display_name":"Out-of-band management","score":0.6190755367279053},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5761712789535522},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5264830589294434},{"id":"https://openalex.org/keywords/frequency-band","display_name":"Frequency band","score":0.5261266231536865},{"id":"https://openalex.org/keywords/radio-spectrum","display_name":"Radio spectrum","score":0.5235556960105896},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4875127971172333},{"id":"https://openalex.org/keywords/multi-band","display_name":"Multi band","score":0.4872943162918091},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.4832930862903595},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4452303647994995},{"id":"https://openalex.org/keywords/multi-band-device","display_name":"Multi-band device","score":0.4253900647163391},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.42273736000061035},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41464096307754517},{"id":"https://openalex.org/keywords/network-architecture","display_name":"Network architecture","score":0.2916800379753113},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.2133629322052002},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.17693600058555603},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.12083566188812256}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7816532254219055},{"id":"https://openalex.org/C43551900","wikidata":"https://www.wikidata.org/wiki/Q1824704","display_name":"Out-of-band management","level":4,"score":0.6190755367279053},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5761712789535522},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5264830589294434},{"id":"https://openalex.org/C2778116611","wikidata":"https://www.wikidata.org/wiki/Q25110567","display_name":"Frequency band","level":3,"score":0.5261266231536865},{"id":"https://openalex.org/C92545706","wikidata":"https://www.wikidata.org/wiki/Q902174","display_name":"Radio spectrum","level":2,"score":0.5235556960105896},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4875127971172333},{"id":"https://openalex.org/C2983672931","wikidata":"https://www.wikidata.org/wiki/Q1756885","display_name":"Multi band","level":3,"score":0.4872943162918091},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.4832930862903595},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4452303647994995},{"id":"https://openalex.org/C134546842","wikidata":"https://www.wikidata.org/wiki/Q1756885","display_name":"Multi-band device","level":3,"score":0.4253900647163391},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.42273736000061035},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41464096307754517},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.2916800379753113},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.2133629322052002},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.17693600058555603},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.12083566188812256},{"id":"https://openalex.org/C21822782","wikidata":"https://www.wikidata.org/wiki/Q131214","display_name":"Antenna (radio)","level":2,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C16986412","wikidata":"https://www.wikidata.org/wiki/Q918419","display_name":"Network management station","level":3,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp57327.2022.10037937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp57327.2022.10037937","pdf_url":null,"source":{"id":"https://openalex.org/S4363607181","display_name":"2022 13th International Symposium on Chinese Spoken Language Processing (ISCSLP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 13th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.699999988079071}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W165956390","https://openalex.org/W1522301498","https://openalex.org/W1552314771","https://openalex.org/W1983108229","https://openalex.org/W2067295501","https://openalex.org/W2094721231","https://openalex.org/W2144404214","https://openalex.org/W2603567530","https://openalex.org/W2696967604","https://openalex.org/W2937484199","https://openalex.org/W2952218014","https://openalex.org/W2962866211","https://openalex.org/W2963868408","https://openalex.org/W2991361823","https://openalex.org/W2998161426","https://openalex.org/W3025844872","https://openalex.org/W3026111682","https://openalex.org/W3092864146","https://openalex.org/W3095248373","https://openalex.org/W3096641561","https://openalex.org/W3099330747","https://openalex.org/W3120336970","https://openalex.org/W3161480375","https://openalex.org/W3162493033","https://openalex.org/W3195288392","https://openalex.org/W3197260772","https://openalex.org/W3201698955","https://openalex.org/W3205770165","https://openalex.org/W3206809722","https://openalex.org/W3211438798","https://openalex.org/W3213188934","https://openalex.org/W4221145205","https://openalex.org/W4224928157","https://openalex.org/W4225302959","https://openalex.org/W4225905067","https://openalex.org/W4226370149","https://openalex.org/W4253928870","https://openalex.org/W4296068760","https://openalex.org/W6631190155","https://openalex.org/W6798972960","https://openalex.org/W6803744562","https://openalex.org/W6810708021"],"related_works":["https://openalex.org/W2272022466","https://openalex.org/W2065095951","https://openalex.org/W4388430575","https://openalex.org/W2285135691","https://openalex.org/W2157243748","https://openalex.org/W2956069452","https://openalex.org/W2138402588","https://openalex.org/W4385282352","https://openalex.org/W3036888818","https://openalex.org/W2035243958"],"abstract_inverted_index":{"Due":[0],"to":[1,6,15,39,48,69,90,126],"the":[2,29,41,71,92,103,110,117,139],"high":[3],"computational":[4],"complexity":[5],"model":[7],"more":[8],"frequency":[9,37,133],"bands,":[10],"it":[11],"is":[12,87],"still":[13],"intractable":[14],"conduct":[16],"full-band":[17,42,64,148],"speech":[18,50,65],"enhancement":[19],"based":[20],"on":[21,116],"deep":[22],"neural":[23],"networks.":[24],"Recent":[25],"studies":[26],"typically":[27],"utilize":[28],"compressed":[30],"perceptually":[31],"motivated":[32],"features":[33],"with":[34],"relatively":[35],"low":[36],"resolution":[38],"filter":[40],"spectrum":[43],"by":[44],"one-stage":[45],"networks,":[46],"leading":[47],"limited":[49],"quality":[51],"improvements.":[52],"In":[53],"this":[54],"paper,":[55],"we":[56,120],"propose":[57],"a":[58,80,84,122],"coordinated":[59],"sub-band":[60,123],"fusion":[61],"network":[62,86],"for":[63],"enhancement,":[66],"which":[67],"aims":[68],"recover":[70,91],"low-":[72],"(0-8kHz),":[73],"middle-":[74,104],"(8-16kHz),":[75],"and":[76,96,105],"high-band":[77,106],"(16-24kHz)":[78],"in":[79,109],"step-wise":[81],"manner.":[82],"Specifically,":[83],"dual-stream":[85],"first":[88],"pretrained":[89],"low-band":[93],"complex":[94],"spectrum,":[95],"another":[97],"two":[98],"sub-networks":[99],"are":[100],"designed":[101],"as":[102],"noise":[107],"suppressors":[108],"magnitude-only":[111],"domain.":[112],"To":[113],"fully":[114],"capitalize":[115],"information":[118],"intercommunication,":[119],"employ":[121],"interaction":[124],"module":[125],"provide":[127],"external":[128],"knowledge":[129],"guidance":[130],"across":[131],"different":[132],"bands.":[134],"Extensive":[135],"experiments":[136],"show":[137],"that":[138],"proposed":[140],"method":[141],"yields":[142],"consistent":[143],"performance":[144],"advantages":[145],"over":[146],"state-of-the-art":[147],"baselines.":[149]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
