{"id":"https://openalex.org/W2768848988","doi":"https://doi.org/10.1109/taslp.2018.2821899","title":"Speech Dereverberation With Context-Aware Recurrent Neural Networks","display_name":"Speech Dereverberation With Context-Aware Recurrent Neural Networks","publication_year":2018,"publication_date":"2018-04-02","ids":{"openalex":"https://openalex.org/W2768848988","doi":"https://doi.org/10.1109/taslp.2018.2821899","mag":"2768848988"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2018.2821899","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2821899","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1711.06309","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068457267","display_name":"Jo\u00e3o Felipe Santos","orcid":"https://orcid.org/0000-0003-3934-3943"},"institutions":[{"id":"https://openalex.org/I197604219","display_name":"National Academies of Sciences, Engineering, and Medicine","ror":"https://ror.org/02eq2w707","country_code":"US","type":"government","lineage":["https://openalex.org/I197604219"]},{"id":"https://openalex.org/I39481719","display_name":"Institut National de la Recherche Scientifique","ror":"https://ror.org/04td37d32","country_code":"CA","type":"education","lineage":["https://openalex.org/I39481719","https://openalex.org/I49663120"]}],"countries":["CA","US"],"is_corresponding":true,"raw_author_name":"Joao Felipe Santos","raw_affiliation_strings":["Institut national de la recherche scientifique, Quebec, QC, CA","\u00c9nergie, Mat\u00e9riaux, T\u00e9l\u00e9communications Research Centre, Institut National de la Recherche Scientifique, Montr\u00e9al, QC, Canada"],"affiliations":[{"raw_affiliation_string":"Institut national de la recherche scientifique, Quebec, QC, CA","institution_ids":["https://openalex.org/I197604219"]},{"raw_affiliation_string":"\u00c9nergie, Mat\u00e9riaux, T\u00e9l\u00e9communications Research Centre, Institut National de la Recherche Scientifique, Montr\u00e9al, QC, Canada","institution_ids":["https://openalex.org/I39481719"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065418889","display_name":"Tiago H. Falk","orcid":"https://orcid.org/0000-0002-5739-2514"},"institutions":[{"id":"https://openalex.org/I197604219","display_name":"National Academies of Sciences, Engineering, and Medicine","ror":"https://ror.org/02eq2w707","country_code":"US","type":"government","lineage":["https://openalex.org/I197604219"]},{"id":"https://openalex.org/I39481719","display_name":"Institut National de la Recherche Scientifique","ror":"https://ror.org/04td37d32","country_code":"CA","type":"education","lineage":["https://openalex.org/I39481719","https://openalex.org/I49663120"]}],"countries":["CA","US"],"is_corresponding":false,"raw_author_name":"Tiago H. Falk","raw_affiliation_strings":["Institut national de la recherche scientifique, Quebec, QC, CA","\u00c9nergie, Mat\u00e9riaux, T\u00e9l\u00e9communications Research Centre, Institut National de la Recherche Scientifique, Montr\u00e9al, QC, Canada"],"affiliations":[{"raw_affiliation_string":"Institut national de la recherche scientifique, Quebec, QC, CA","institution_ids":["https://openalex.org/I197604219"]},{"raw_affiliation_string":"\u00c9nergie, Mat\u00e9riaux, T\u00e9l\u00e9communications Research Centre, Institut National de la Recherche Scientifique, Montr\u00e9al, QC, Canada","institution_ids":["https://openalex.org/I39481719"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068457267"],"corresponding_institution_ids":["https://openalex.org/I197604219","https://openalex.org/I39481719"],"apc_list":null,"apc_paid":null,"fwci":0.1658,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.4072051,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"26","issue":"7","first_page":"1236","last_page":"1246"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.9104824066162109},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7618564963340759},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7437195181846619},{"id":"https://openalex.org/keywords/pesq","display_name":"PESQ","score":0.5996918678283691},{"id":"https://openalex.org/keywords/impulse","display_name":"Impulse (physics)","score":0.5062255263328552},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4948837161064148},{"id":"https://openalex.org/keywords/impulse-response","display_name":"Impulse response","score":0.48812612891197205},{"id":"https://openalex.org/keywords/active-listening","display_name":"Active listening","score":0.4721249043941498},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.46513575315475464},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.45499783754348755},{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.44439876079559326},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.43397560715675354},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43283021450042725},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.42827659845352173},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3147791028022766},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.19623544812202454},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.18573680520057678},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12108975648880005}],"concepts":[{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.9104824066162109},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7618564963340759},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7437195181846619},{"id":"https://openalex.org/C103734657","wikidata":"https://www.wikidata.org/wiki/Q2739975","display_name":"PESQ","level":4,"score":0.5996918678283691},{"id":"https://openalex.org/C70836080","wikidata":"https://www.wikidata.org/wiki/Q837940","display_name":"Impulse (physics)","level":2,"score":0.5062255263328552},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4948837161064148},{"id":"https://openalex.org/C72279823","wikidata":"https://www.wikidata.org/wiki/Q1139726","display_name":"Impulse response","level":2,"score":0.48812612891197205},{"id":"https://openalex.org/C177291462","wikidata":"https://www.wikidata.org/wiki/Q423038","display_name":"Active listening","level":2,"score":0.4721249043941498},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.46513575315475464},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.45499783754348755},{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.44439876079559326},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.43397560715675354},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43283021450042725},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.42827659845352173},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3147791028022766},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.19623544812202454},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.18573680520057678},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12108975648880005},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/taslp.2018.2821899","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2821899","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1711.06309","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1711.06309","pdf_url":"https://arxiv.org/pdf/1711.06309","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2768848988","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1711.06309.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1711.06309","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1711.06309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1711.06309","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1711.06309","pdf_url":"https://arxiv.org/pdf/1711.06309","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.4699999988079071}],"awards":[{"id":"https://openalex.org/G1833903074","display_name":null,"funder_award_id":"K40 GPU","funder_id":"https://openalex.org/F4320309480","funder_display_name":"Nvidia"},{"id":"https://openalex.org/G2010355708","display_name":null,"funder_award_id":"Tesla K40 GPU","funder_id":"https://openalex.org/F4320309480","funder_display_name":"Nvidia"},{"id":"https://openalex.org/G5801408398","display_name":null,"funder_award_id":"Tesla K40","funder_id":"https://openalex.org/F4320309480","funder_display_name":"Nvidia"}],"funders":[{"id":"https://openalex.org/F4320309327","display_name":"Google","ror":"https://ror.org/00njsd438"},{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320321747","display_name":"Fonds Qu\u00e9b\u00e9cois de la Recherche sur la Nature et les Technologies","ror":"https://ror.org/00b9f9778"},{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2768848988.pdf","grobid_xml":"https://content.openalex.org/works/W2768848988.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W1522199561","https://openalex.org/W1603978816","https://openalex.org/W1810943226","https://openalex.org/W1888374534","https://openalex.org/W1973669708","https://openalex.org/W2001124347","https://openalex.org/W2006129368","https://openalex.org/W2041119287","https://openalex.org/W2044893557","https://openalex.org/W2046869671","https://openalex.org/W2069681747","https://openalex.org/W2094461119","https://openalex.org/W2101042021","https://openalex.org/W2120847449","https://openalex.org/W2125114513","https://openalex.org/W2141998673","https://openalex.org/W2151938450","https://openalex.org/W2172140247","https://openalex.org/W2172491908","https://openalex.org/W2233657726","https://openalex.org/W2401206005","https://openalex.org/W2406737436","https://openalex.org/W2407277936","https://openalex.org/W2542605056","https://openalex.org/W2575485141","https://openalex.org/W2587329895","https://openalex.org/W2609317876","https://openalex.org/W2668911695","https://openalex.org/W2708109968","https://openalex.org/W2949382160","https://openalex.org/W2964121744","https://openalex.org/W2964199361","https://openalex.org/W6631190155","https://openalex.org/W6638273328","https://openalex.org/W6640090968","https://openalex.org/W6680987062","https://openalex.org/W6712262472"],"related_works":["https://openalex.org/W2994785103","https://openalex.org/W3198661668","https://openalex.org/W26243928","https://openalex.org/W2886938596","https://openalex.org/W2591355762","https://openalex.org/W2951616896","https://openalex.org/W2795050058","https://openalex.org/W2287873126","https://openalex.org/W3155401483","https://openalex.org/W2963941778","https://openalex.org/W3156248872","https://openalex.org/W1840572374","https://openalex.org/W3196660995","https://openalex.org/W2797187289","https://openalex.org/W3199713199","https://openalex.org/W2368749372","https://openalex.org/W3198130028","https://openalex.org/W3197982663","https://openalex.org/W2167725581","https://openalex.org/W2139450919"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"propose":[4],"a":[5,40,47,54,65],"model":[6,63,68,119],"to":[7,90,112,122,124],"perform":[8],"speech":[9,96],"dereverberation":[10],"by":[11],"estimating":[12],"its":[13],"spectral":[14],"magnitude":[15],"from":[16,46],"the":[17,37,76,148],"reverberant":[18,113],"counterpart.":[19],"Our":[20,62],"models":[21,153],"are":[22],"capable":[23],"of":[24,51,83,88,95,156],"extracting":[25,59],"features":[26,45],"that":[27,69],"take":[28],"into":[29],"account":[30],"both":[31],"short-":[32],"and":[33,53,103,140],"long-term":[34,60],"dependencies":[35],"in":[36,154],"signal":[38],"through":[39],"convolutional":[41],"encoder":[42],"(which":[43],"extracts":[44],"short,":[48],"bounded":[49],"context":[50,72],"frames)":[52],"recurrent":[55],"neural":[56],"network":[57],"for":[58],"information.":[61],"outperforms":[64],"recently":[66],"proposed":[67,149],"uses":[70],"different":[71,138],"information":[73],"depending":[74],"on":[75,92,99,105],"reverberation":[77,142],"time,":[78],"without":[79],"requiring":[80],"any":[81],"sort":[82],"additional":[84],"input,":[85],"yielding":[86],"improvements":[87],"up":[89],"0.4":[91],"perceptual":[93,106],"evaluation":[94],"quality,":[97],"0.3":[98],"short-time":[100],"objective":[101,107],"intelligibility,":[102],"1.0":[104],"listening":[108,145],"quality":[109],"assessment":[110],"relative":[111],"speech.":[114],"We":[115],"also":[116],"show":[117,147],"our":[118],"is":[120],"able":[121],"generalize":[123],"real":[125],"room":[126,135],"impulse":[127,136],"responses":[128],"even":[129],"when":[130],"only":[131],"trained":[132],"with":[133],"simulated":[134],"responses,":[137],"speakers,":[139],"high":[141],"times.":[143],"Finally,":[144],"tests":[146],"method":[150],"outperforming":[151],"benchmark":[152],"reduction":[155],"perceived":[157],"reverberation.":[158]},"counts_by_year":[{"year":2018,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
