{"id":"https://openalex.org/W4392904504","doi":"https://doi.org/10.1109/icassp48485.2024.10447644","title":"Combining Conformer and Dual-Path-Transformer Networks for Single Channel Noisy Reverberant Speech Separation","display_name":"Combining Conformer and Dual-Path-Transformer Networks for Single Channel Noisy Reverberant Speech Separation","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392904504","doi":"https://doi.org/10.1109/icassp48485.2024.10447644"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10447644","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10447644","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://eprints.whiterose.ac.uk/id/eprint/207516/1/_Will_ICASSP24__Insights_ConSepT%20%282%29.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004802529","display_name":"William Ravenscroft","orcid":"https://orcid.org/0000-0002-0780-3303"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"William Ravenscroft","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027797344","display_name":"Stefan Goetze","orcid":"https://orcid.org/0000-0003-1044-7343"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Stefan Goetze","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030528300","display_name":"Thomas Hain","orcid":"https://orcid.org/0000-0003-0939-3464"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Thomas Hain","raw_affiliation_strings":["The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom"],"affiliations":[{"raw_affiliation_string":"The University of Sheffield,Department of Computer Science,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, The University of Sheffield, Sheffield, United Kingdom","institution_ids":["https://openalex.org/I91136226"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004802529"],"corresponding_institution_ids":["https://openalex.org/I91136226"],"apc_list":null,"apc_paid":null,"fwci":1.7263,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.83676065,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"11491","last_page":"11495"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6564565300941467},{"id":"https://openalex.org/keywords/anechoic-chamber","display_name":"Anechoic chamber","score":0.5858684182167053},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5193703770637512},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4884614050388336},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4304870367050171},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34885743260383606},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07612144947052002}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6564565300941467},{"id":"https://openalex.org/C149712133","wikidata":"https://www.wikidata.org/wiki/Q332774","display_name":"Anechoic chamber","level":2,"score":0.5858684182167053},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5193703770637512},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4884614050388336},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4304870367050171},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34885743260383606},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07612144947052002}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp48485.2024.10447644","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10447644","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.whiterose.ac.uk:207516","is_oa":true,"landing_page_url":"https://orcid.org/0000-0002-0780-3303>,","pdf_url":"https://eprints.whiterose.ac.uk/id/eprint/207516/1/_Will_ICASSP24__Insights_ConSepT%20%282%29.pdf","source":{"id":"https://openalex.org/S4306400854","display_name":"White Rose Research Online (University of Leeds, The University of Sheffield, University of York)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2800616092","host_organization_name":"White Rose University Consortium","host_organization_lineage":["https://openalex.org/I2800616092"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":{"id":"pmh:oai:eprints.whiterose.ac.uk:207516","is_oa":true,"landing_page_url":"https://orcid.org/0000-0002-0780-3303>,","pdf_url":"https://eprints.whiterose.ac.uk/id/eprint/207516/1/_Will_ICASSP24__Insights_ConSepT%20%282%29.pdf","source":{"id":"https://openalex.org/S4306400854","display_name":"White Rose Research Online (University of Leeds, The University of Sheffield, University of York)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2800616092","host_organization_name":"White Rose University Consortium","host_organization_lineage":["https://openalex.org/I2800616092"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"},{"id":"https://openalex.org/F4320338440","display_name":"HORIZON EUROPE Health","ror":null}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392904504.pdf"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W70181719","https://openalex.org/W1552314771","https://openalex.org/W2100471625","https://openalex.org/W2106272332","https://openalex.org/W2125114513","https://openalex.org/W2147166770","https://openalex.org/W2516001803","https://openalex.org/W2564013664","https://openalex.org/W2734774145","https://openalex.org/W2952218014","https://openalex.org/W2962715207","https://openalex.org/W2962935966","https://openalex.org/W2982471419","https://openalex.org/W3015191643","https://openalex.org/W3015199127","https://openalex.org/W3086154751","https://openalex.org/W3096893582","https://openalex.org/W3097777922","https://openalex.org/W3099330747","https://openalex.org/W3163652268","https://openalex.org/W3163842642","https://openalex.org/W4280557595","https://openalex.org/W4388117238","https://openalex.org/W4391021644","https://openalex.org/W6698138081","https://openalex.org/W6798326965","https://openalex.org/W6844662008"],"related_works":["https://openalex.org/W2017779656","https://openalex.org/W2001172292","https://openalex.org/W2169567031","https://openalex.org/W1849802015","https://openalex.org/W3097766872","https://openalex.org/W2091951235","https://openalex.org/W4239222529","https://openalex.org/W2354873283","https://openalex.org/W2033914206","https://openalex.org/W2042327336"],"abstract_inverted_index":{"Separation":[0],"of":[1,8,41,87,92,112],"overlapping":[2],"speakers":[3],"remains":[4],"an":[5],"active":[6],"area":[7],"speech":[9],"technology":[10],"research.":[11],"Many":[12],"deep":[13],"neural":[14],"network":[15],"(DNN)":[16],"separation":[17],"models":[18,33],"propose":[19],"modelling":[20],"local":[21],"and":[22,36,47,57,102,124,135,139],"global":[23],"temporal":[24],"context":[25],"separately":[26],"using":[27,145],"alternating":[28],"DNN":[29],"layers.":[30],"Two":[31],"such":[32],"are":[34,96],"SepFormer":[35,51],"TD-Conformer.":[37],"The":[38,84,115,142],"largest":[39],"configurations":[40],"each":[42],"have":[43],"comparable":[44],"computational":[45,79],"cost":[46],"similar":[48],"performance;":[49],"with":[50],"performing":[52],"better":[53,60],"on":[54,62,99,137,156],"anechoic":[55],"data":[56],"TD-Conformer":[58],"yielding":[59],"results":[61],"noisy":[63],"reverberant":[64],"data.":[65],"This":[66],"work":[67],"combines":[68],"these":[69],"two":[70],"model":[71,90,117,143],"types":[72],"to":[73,120,149],"gain":[74],"insights":[75],"into":[76],"how":[77],"their":[78,82],"characteristics":[80],"affect":[81],"performance.":[83],"generalization":[85],"benefits":[86],"the":[88,93,100,103,157],"larger":[89],"size":[91],"conformer":[94],"layers":[95],"demonstrated":[97],"both":[98],"WHAMR":[101,146],"out-of-domain":[104,158],"far-field":[105],"evaluation":[106,113],"set":[107],"MC-WSJ-AV":[108,159],"across":[109],"a":[110],"number":[111],"metrics.":[114],"proposed":[116],"is":[118,147],"able":[119,148],"achieve":[121,150],"22.1":[122],"dB":[123,126,152],"14.7":[125],"average":[127,153],"scale-invariant":[128],"signal-to-distortion":[129],"ratio":[130],"(SISDR)":[131],"improvement":[132,155],"when":[133],"trained":[134,144],"evaluated":[136],"WSJ0-2Mix":[138],"WHAMR,":[140],"respectively.":[141],"4.3":[151],"SISDR":[154],"dataset.":[160]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
