{"id":"https://openalex.org/W4312257080","doi":"https://doi.org/10.1109/iwaenc53105.2022.9914752","title":"Utterance Weighted Multi-Dilation Temporal Convolutional Networks for Monaural Speech Dereverberation","display_name":"Utterance Weighted Multi-Dilation Temporal Convolutional Networks for Monaural Speech Dereverberation","publication_year":2022,"publication_date":"2022-09-05","ids":{"openalex":"https://openalex.org/W4312257080","doi":"https://doi.org/10.1109/iwaenc53105.2022.9914752"},"language":"en","primary_location":{"id":"doi:10.1109/iwaenc53105.2022.9914752","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwaenc53105.2022.9914752","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Workshop on Acoustic Signal Enhancement (IWAENC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004802529","display_name":"William Ravenscroft","orcid":"https://orcid.org/0000-0002-0780-3303"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"William Ravenscroft","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027797344","display_name":"Stefan Goetze","orcid":"https://orcid.org/0000-0003-1044-7343"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Stefan Goetze","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030528300","display_name":"Thomas Hain","orcid":"https://orcid.org/0000-0003-0939-3464"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Thomas Hain","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004802529"],"corresponding_institution_ids":["https://openalex.org/I91136226"],"apc_list":null,"apc_paid":null,"fwci":1.1905,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.78299343,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9700999855995178,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.749672532081604},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.6642693877220154},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6585841178894043},{"id":"https://openalex.org/keywords/dilation","display_name":"Dilation (metric space)","score":0.6128777265548706},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6034818887710571},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5669141411781311},{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.47446662187576294},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4130796492099762},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38475072383880615},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3760460913181305},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2085767686367035},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1476472020149231}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.749672532081604},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.6642693877220154},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6585841178894043},{"id":"https://openalex.org/C2780757906","wikidata":"https://www.wikidata.org/wiki/Q5276676","display_name":"Dilation (metric space)","level":2,"score":0.6128777265548706},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6034818887710571},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5669141411781311},{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.47446662187576294},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4130796492099762},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38475072383880615},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3760460913181305},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2085767686367035},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1476472020149231},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iwaenc53105.2022.9914752","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwaenc53105.2022.9914752","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Workshop on Acoustic Signal Enhancement (IWAENC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W187699606","https://openalex.org/W1552314771","https://openalex.org/W1598327410","https://openalex.org/W1677182931","https://openalex.org/W1820182450","https://openalex.org/W2035412504","https://openalex.org/W2516001803","https://openalex.org/W2747732471","https://openalex.org/W2752782242","https://openalex.org/W2937484199","https://openalex.org/W2952218014","https://openalex.org/W2963941778","https://openalex.org/W2964058413","https://openalex.org/W2982471419","https://openalex.org/W3007256793","https://openalex.org/W3015191643","https://openalex.org/W3026111682","https://openalex.org/W3034421924","https://openalex.org/W3086154751","https://openalex.org/W3096159803","https://openalex.org/W3097056996","https://openalex.org/W3099330747","https://openalex.org/W3134202725","https://openalex.org/W3145364388","https://openalex.org/W3167533889","https://openalex.org/W3198661668","https://openalex.org/W3204647170","https://openalex.org/W3215005424","https://openalex.org/W4280557595","https://openalex.org/W4312580459","https://openalex.org/W4312959668","https://openalex.org/W6744955691"],"related_works":["https://openalex.org/W3156786002","https://openalex.org/W2738221750","https://openalex.org/W2606416966","https://openalex.org/W2732542196","https://openalex.org/W564581980","https://openalex.org/W3165266428","https://openalex.org/W3186111093","https://openalex.org/W4214561993","https://openalex.org/W2574739773","https://openalex.org/W3129634582"],"abstract_inverted_index":{"Speech":[0],"dereverberation":[1],"is":[2,53,90,113,140],"an":[3],"important":[4],"stage":[5],"in":[6,13,39,60,78,86],"many":[7],"speech":[8],"technology":[9],"applications.":[10],"Recent":[11],"work":[12,47],"this":[14,46,93],"area":[15],"has":[16],"been":[17,34],"dominated":[18],"by":[19],"deep":[20,29],"neural":[21],"network":[22,98],"models.":[23,62],"Temporal":[24],"convolutional":[25,84,97,130],"networks":[26],"(TCNs)":[27],"are":[28],"learning":[30],"models":[31],"that":[32,92],"have":[33],"proposed":[35,54,64],"for":[36],"sequence":[37],"modelling":[38],"the":[40,67,87,102,110,120,123,127,137,148,158],"task":[41],"of":[42,122,129],"dereverberating":[43],"speech.":[44],"In":[45],"a":[48,114],"weighted":[49,94],"multi-dilation":[50,95],"depthwise-separable":[51,58],"convolution":[52,65],"to":[55,69,118],"replace":[56],"standard":[57],"convolutions":[59],"TCN":[61,68,103,139],"This":[63],"enables":[66],"dynamically":[70],"focus":[71],"on":[72,157],"more":[73,115],"or":[74],"less":[75],"local":[76],"information":[77],"its":[79],"receptive":[80],"field":[81],"at":[82],"each":[83],"block":[85],"network.":[88],"It":[89],"shown":[91],"temporal":[96],"(WD-TCN)":[99],"consistently":[100],"outperforms":[101],"across":[104],"various":[105],"model":[106,112,124,152],"configurations":[107],"and":[108,147],"using":[109],"WD-TCN":[111,151],"parameter-efficient":[116],"method":[117],"improve":[119],"performance":[121,134],"than":[125],"increasing":[126],"number":[128],"blocks.":[131],"The":[132],"best":[133,149],"improvement":[135],"over":[136],"baseline":[138],"0.55":[141],"dB":[142,155],"scale-invariant":[143],"signal-to-distortion":[144],"ratio":[145],"(SISDR)":[146],"performing":[150],"attains":[153],"12.26":[154],"SISDR":[156],"WHAMR":[159],"dataset.":[160]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
