{"id":"https://openalex.org/W4408355435","doi":"https://doi.org/10.1109/icassp49660.2025.10890458","title":"Dynamic Frequency-Adaptive Knowledge Distillation for Speech Enhancement","display_name":"Dynamic Frequency-Adaptive Knowledge Distillation for Speech Enhancement","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408355435","doi":"https://doi.org/10.1109/icassp49660.2025.10890458"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890458","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890458","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053766627","display_name":"Xinyu Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xihao Yuan","raw_affiliation_strings":["Huawei,Noah&#x2019;s Ark Lab,China"],"affiliations":[{"raw_affiliation_string":"Huawei,Noah&#x2019;s Ark Lab,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100390236","display_name":"Siqi Liu","orcid":"https://orcid.org/0000-0002-4675-5498"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siqi Liu","raw_affiliation_strings":["Huawei,Noah&#x2019;s Ark Lab,China"],"affiliations":[{"raw_affiliation_string":"Huawei,Noah&#x2019;s Ark Lab,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081216284","display_name":"Hanting Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanting Chen","raw_affiliation_strings":["Huawei,Noah&#x2019;s Ark Lab,China"],"affiliations":[{"raw_affiliation_string":"Huawei,Noah&#x2019;s Ark Lab,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100388562","display_name":"Lu Zhou","orcid":"https://orcid.org/0000-0001-6804-3865"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Zhou","raw_affiliation_strings":["Huawei,Noah&#x2019;s Ark Lab,China"],"affiliations":[{"raw_affiliation_string":"Huawei,Noah&#x2019;s Ark Lab,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083878190","display_name":"Li Jian","orcid":"https://orcid.org/0000-0001-7544-5344"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Li","raw_affiliation_strings":["Huawei,Noah&#x2019;s Ark Lab,China"],"affiliations":[{"raw_affiliation_string":"Huawei,Noah&#x2019;s Ark Lab,China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5104107845","display_name":"Jie Hu","orcid":"https://orcid.org/0000-0003-2067-5403"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Hu","raw_affiliation_strings":["Huawei,Noah&#x2019;s Ark Lab,China"],"affiliations":[{"raw_affiliation_string":"Huawei,Noah&#x2019;s Ark Lab,China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5053766627"],"corresponding_institution_ids":["https://openalex.org/I2250955327"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05806182,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9506000280380249,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9484000205993652,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.6669809818267822},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6645751595497131},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.49885058403015137},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.48574429750442505},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27775073051452637},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06092563271522522},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.059035927057266235}],"concepts":[{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.6669809818267822},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6645751595497131},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.49885058403015137},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.48574429750442505},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27775073051452637},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06092563271522522},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.059035927057266235},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890458","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890458","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2013912476","https://openalex.org/W2603567530","https://openalex.org/W2739879705","https://openalex.org/W2889442120","https://openalex.org/W2952218014","https://openalex.org/W2962851801","https://openalex.org/W2964111476","https://openalex.org/W2982157312","https://openalex.org/W2986015886","https://openalex.org/W3007063652","https://openalex.org/W3031505850","https://openalex.org/W3096408984","https://openalex.org/W3096893582","https://openalex.org/W3097906045","https://openalex.org/W3108075360","https://openalex.org/W3174102142","https://openalex.org/W4226185896","https://openalex.org/W4319586676","https://openalex.org/W4385822385","https://openalex.org/W6738957339","https://openalex.org/W6748082341","https://openalex.org/W6751528251","https://openalex.org/W6757639898","https://openalex.org/W6767584280"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W3096184950","https://openalex.org/W4231424160"],"abstract_inverted_index":{"Deep":[0],"learning-based":[1],"speech":[2],"enhancement":[3],"(SE)":[4],"models":[5],"have":[6],"recently":[7],"outperformed":[8],"traditional":[9],"techniques,":[10],"yet":[11],"their":[12],"deployment":[13],"on":[14,70,84],"resource-constrained":[15],"devices":[16],"remains":[17],"challenging":[18],"due":[19],"to":[20,37,60],"high":[21,51],"computational":[22],"and":[23,52,55,90],"memory":[24],"demands.":[25],"This":[26],"paper":[27],"introduces":[28],"a":[29],"novel":[30],"dynamic":[31],"frequency-adaptive":[32],"knowledge":[33,115],"distillation":[34,116],"(DFKD)":[35],"approach":[36],"effectively":[38],"compress":[39],"SE":[40,72,120],"models.":[41],"Our":[42],"method":[43,97],"dynamically":[44],"assesses":[45],"the":[46,57,62,71,78,102,105],"model\u2019s":[47],"output,":[48],"distinguishing":[49],"between":[50],"low-frequency":[53],"components,":[54],"adapts":[56],"learning":[58],"objectives":[59],"meet":[61],"unique":[63],"requirements":[64],"of":[65,104],"different":[66],"frequency":[67],"bands,":[68],"capitalizing":[69],"task\u2019s":[73],"inherent":[74],"characteristics.":[75],"To":[76],"evaluate":[77],"DFKD\u2019s":[79],"efficacy,":[80],"we":[81],"conducted":[82],"experiments":[83],"three":[85],"state-of-the-art":[86],"models:":[87],"DCCRN,":[88],"ConTasNet,":[89],"DPTNet.":[91],"The":[92],"results":[93],"demonstrate":[94],"that":[95],"our":[96],"not":[98],"only":[99],"significantly":[100],"enhances":[101],"performance":[103],"compressed":[106],"model":[107],"(student":[108],"model)":[109],"but":[110],"also":[111],"surpasses":[112],"other":[113],"logit-based":[114],"methods":[117],"specifically":[118],"for":[119],"tasks.":[121]},"counts_by_year":[],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
