{"id":"https://openalex.org/W4372260572","doi":"https://doi.org/10.1109/icassp49357.2023.10095230","title":"Deformable Temporal Convolutional Networks for Monaural Noisy Reverberant Speech Separation","display_name":"Deformable Temporal Convolutional Networks for Monaural Noisy Reverberant Speech Separation","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372260572","doi":"https://doi.org/10.1109/icassp49357.2023.10095230"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10095230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004802529","display_name":"William Ravenscroft","orcid":"https://orcid.org/0000-0002-0780-3303"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"William Ravenscroft","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027797344","display_name":"Stefan Goetze","orcid":"https://orcid.org/0000-0003-1044-7343"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Stefan Goetze","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030528300","display_name":"Thomas Hain","orcid":"https://orcid.org/0000-0003-0939-3464"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Thomas Hain","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004802529"],"corresponding_institution_ids":["https://openalex.org/I91136226"],"apc_list":null,"apc_paid":null,"fwci":2.2743,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.88711854,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.7195614576339722},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7133826613426208},{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.6647985577583313},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6411305665969849},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6301963329315186},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.6169662475585938},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.502793550491333},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.47671645879745483},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.4369376003742218},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.43650802969932556},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.43593552708625793},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.4353299140930176},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3509605824947357},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2511700987815857},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.2295750379562378},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.114723801612854},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.10869967937469482},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09557527303695679}],"concepts":[{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.7195614576339722},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7133826613426208},{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.6647985577583313},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6411305665969849},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6301963329315186},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.6169662475585938},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.502793550491333},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.47671645879745483},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.4369376003742218},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.43650802969932556},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.43593552708625793},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.4353299140930176},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3509605824947357},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2511700987815857},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.2295750379562378},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.114723801612854},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.10869967937469482},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09557527303695679},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10095230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.5899999737739563,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320307785","display_name":"3M","ror":"https://ror.org/00mgss748"},{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W70181719","https://openalex.org/W1552314771","https://openalex.org/W2125114513","https://openalex.org/W2221409856","https://openalex.org/W2334904945","https://openalex.org/W2516001803","https://openalex.org/W2531409750","https://openalex.org/W2601564443","https://openalex.org/W2734774145","https://openalex.org/W2952218014","https://openalex.org/W2962715207","https://openalex.org/W2962935966","https://openalex.org/W2996969697","https://openalex.org/W3015191643","https://openalex.org/W3015636705","https://openalex.org/W3015788098","https://openalex.org/W3086154751","https://openalex.org/W3099330747","https://openalex.org/W3110857032","https://openalex.org/W3150964372","https://openalex.org/W3163652268","https://openalex.org/W3167533889","https://openalex.org/W3185109982","https://openalex.org/W3191469971","https://openalex.org/W3213661887","https://openalex.org/W4224938485","https://openalex.org/W4280557595","https://openalex.org/W4283727958","https://openalex.org/W4296068774","https://openalex.org/W4312257080","https://openalex.org/W4312580459","https://openalex.org/W6702735670"],"related_works":["https://openalex.org/W2621851636","https://openalex.org/W2103031592","https://openalex.org/W1967226023","https://openalex.org/W2538939196","https://openalex.org/W3045520545","https://openalex.org/W3150394233","https://openalex.org/W2120771489","https://openalex.org/W2051376034","https://openalex.org/W2955597484","https://openalex.org/W3110551121"],"abstract_inverted_index":{"Speech":[0],"separation":[1,31,50,156],"models":[2,16,37,56,102,120],"are":[3,121],"used":[4],"for":[5,48,114],"isolating":[6],"individual":[7],"speakers":[8],"in":[9,68],"many":[10],"speech":[11,30,49,69,87,116],"processing":[12],"applications.":[13],"Deep":[14],"learning":[15],"have":[17,60,104],"been":[18],"shown":[19,45,72],"to":[20,22,99,103,110,158],"lead":[21],"state-of-the-art":[23],"(SOTA)":[24],"results":[25,47],"on":[26,138],"a":[27,61,78,97],"number":[28],"of":[29,36,54,77,85,123,148],"benchmarks.":[32],"One":[33],"such":[34],"class":[35],"known":[38],"as":[39,96],"temporal":[40],"convolutional":[41],"networks":[42],"(TCNs)":[43],"has":[44,71],"promising":[46],"tasks.":[51],"A":[52,142],"limitation":[53],"these":[55],"is":[57,94,151],"that":[58,73,107],"they":[59],"fixed":[62],"receptive":[63],"field":[64],"(RF).":[65],"Recent":[66],"research":[67],"dereverberation":[70],"the":[74,82,86,135,139],"optimal":[75],"RF":[76],"TCN":[79,101,146],"varies":[80],"with":[81],"reverberation":[83,112],"characteristics":[84],"signal.":[88],"In":[89],"this":[90],"work":[91],"deformable":[92,145],"convolution":[93],"proposed":[95,119,152],"solution":[98],"allow":[100],"dynamic":[105],"RFs":[106],"can":[108],"adapt":[109],"various":[111],"times":[113],"reverberant":[115],"separation.":[117],"The":[118],"capable":[122],"achieving":[124],"an":[125],"11.1":[126],"dB":[127],"average":[128],"scale-invariant":[129],"signal-to-distortion":[130],"ratio":[131],"(SISDR)":[132],"improvement":[133],"over":[134],"input":[136],"signal":[137],"WHAMR":[140],"benchmark.":[141],"relatively":[143],"small":[144],"model":[147],"1.3M":[149],"parameters":[150],"which":[153],"gives":[154],"comparable":[155],"performance":[157],"larger":[159],"and":[160],"more":[161],"computationally":[162],"complex":[163],"models.":[164]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
