{"id":"https://openalex.org/W3109458322","doi":"https://doi.org/10.1109/taslp.2020.3036776","title":"Online Multichannel Speech Enhancement Based on Recursive EM and DNN-Based Speech Presence Estimation","display_name":"Online Multichannel Speech Enhancement Based on Recursive EM and DNN-Based Speech Presence Estimation","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3109458322","doi":"https://doi.org/10.1109/taslp.2020.3036776","mag":"3109458322"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2020.3036776","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2020.3036776","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://vbn.aau.dk/da/publications/13577556-6433-4324-a69c-7167ca6b7e2a","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064609638","display_name":"Juan M. Mart\u00edn-Do\u00f1as","orcid":"https://orcid.org/0000-0003-4874-0166"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Juan Manuel Mart\u00edn-Do\u00f1as","raw_affiliation_strings":["Department of Signal Theory, Telematics and Communications, Universidad de Granada, Granada, Spain"],"raw_orcid":"https://orcid.org/0000-0003-4874-0166","affiliations":[{"raw_affiliation_string":"Department of Signal Theory, Telematics and Communications, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101679595","display_name":"Jesper Jensen","orcid":"https://orcid.org/0000-0003-1478-622X"},"institutions":[{"id":"https://openalex.org/I4210130492","display_name":"Oticon Medical (Denmark)","ror":"https://ror.org/03c5ds320","country_code":"DK","type":"company","lineage":["https://openalex.org/I4210130492"]},{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Jesper Jensen","raw_affiliation_strings":["Department of Electronic Systems, Aalborg University, Aalborg, Denmark","Oticon A/S, Sm\u00f8rum, Denmark"],"raw_orcid":"https://orcid.org/0000-0003-1478-622X","affiliations":[{"raw_affiliation_string":"Department of Electronic Systems, Aalborg University, Aalborg, Denmark","institution_ids":["https://openalex.org/I891191580"]},{"raw_affiliation_string":"Oticon A/S, Sm\u00f8rum, Denmark","institution_ids":["https://openalex.org/I4210130492"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090108098","display_name":"Zheng\u2010Hua Tan","orcid":"https://orcid.org/0000-0001-6856-8928"},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Zheng-Hua Tan","raw_affiliation_strings":["Department of Electronic Systems, Aalborg University, Aalborg, Denmark"],"raw_orcid":"https://orcid.org/0000-0001-6856-8928","affiliations":[{"raw_affiliation_string":"Department of Electronic Systems, Aalborg University, Aalborg, Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024291487","display_name":"\u00c1ngel M. G\u00f3mez","orcid":"https://orcid.org/0000-0002-9995-3068"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Angel M. Gomez","raw_affiliation_strings":["Department of Signal Theory, Telematics and Communications, Universidad de Granada, Granada, Spain"],"raw_orcid":"https://orcid.org/0000-0002-9995-3068","affiliations":[{"raw_affiliation_string":"Department of Signal Theory, Telematics and Communications, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078514616","display_name":"Antonio M. Peinado","orcid":"https://orcid.org/0000-0001-8214-6676"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Antonio M. Peinado","raw_affiliation_strings":["Department of Signal Theory, Telematics and Communications, Universidad de Granada, Granada, Spain"],"raw_orcid":"https://orcid.org/0000-0001-8214-6676","affiliations":[{"raw_affiliation_string":"Department of Signal Theory, Telematics and Communications, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.2811,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.89186016,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"28","issue":null,"first_page":"3080","last_page":"3094"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7860057353973389},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.734100341796875},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6551425457000732},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.6482023596763611},{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.5788141489028931},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.5320476293563843},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.5077341794967651},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3397766947746277},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.331390380859375},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12709325551986694},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.07560837268829346}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7860057353973389},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.734100341796875},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6551425457000732},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.6482023596763611},{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.5788141489028931},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.5320476293563843},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.5077341794967651},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3397766947746277},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.331390380859375},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12709325551986694},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.07560837268829346},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/taslp.2020.3036776","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2020.3036776","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:pure.atira.dk:openaire/13577556-6433-4324-a69c-7167ca6b7e2a","is_oa":true,"landing_page_url":"https://vbn.aau.dk/da/publications/13577556-6433-4324-a69c-7167ca6b7e2a","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Mart\u00edn-Do\u00f1as, J M, Jensen, J, Tan, Z-H, Gomez, A & Peinado, A 2020, 'Online Multichannel Speech Enhancement Based on Recursive EM and DNN-based Speech Presence Estimation', IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 28, 9252844, pp. 3080-3094. https://doi.org/10.1109/TASLP.2020.3036776","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:digibug.ugr.es:10481/71502","is_oa":true,"landing_page_url":"http://hdl.handle.net/10481/71502","pdf_url":null,"source":{"id":"https://openalex.org/S4306400567","display_name":"Institutional Repository of the University of Granada (University of Granada)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I173304897","host_organization_name":"Universidad de Granada","host_organization_lineage":["https://openalex.org/I173304897"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:pure.atira.dk:publications/13577556-6433-4324-a69c-7167ca6b7e2a","is_oa":true,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=85096859719&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Mart\u00edn-Do\u00f1as , J M , Jensen , J , Tan , Z-H , Gomez , A &amp; Peinado , A 2020 , ' Online Multichannel Speech Enhancement Based on Recursive EM and DNN-based Speech Presence Estimation ' , IEEE/ACM Transactions on Audio, Speech, and Language Processing , vol. 28 , 9252844 , pp. 3080-3094 . https://doi.org/10.1109/TASLP.2020.3036776","raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire/13577556-6433-4324-a69c-7167ca6b7e2a","is_oa":true,"landing_page_url":"https://vbn.aau.dk/da/publications/13577556-6433-4324-a69c-7167ca6b7e2a","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Mart\u00edn-Do\u00f1as, J M, Jensen, J, Tan, Z-H, Gomez, A & Peinado, A 2020, 'Online Multichannel Speech Enhancement Based on Recursive EM and DNN-based Speech Presence Estimation', IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 28, 9252844, pp. 3080-3094. https://doi.org/10.1109/TASLP.2020.3036776","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7300000190734863,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G3690828678","display_name":null,"funder_award_id":"PID2019","funder_id":"https://openalex.org/F4320322930","funder_display_name":"Ministerio de Ciencia e Innovaci\u00f3n"},{"id":"https://openalex.org/G7399548993","display_name":null,"funder_award_id":"PID2019-104206GB-I00","funder_id":"https://openalex.org/F4320322930","funder_display_name":"Ministerio de Ciencia e Innovaci\u00f3n"}],"funders":[{"id":"https://openalex.org/F4320322930","display_name":"Ministerio de Ciencia e Innovaci\u00f3n","ror":"https://ror.org/034900433"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W250076511","https://openalex.org/W1503775994","https://openalex.org/W1686266550","https://openalex.org/W1965392255","https://openalex.org/W1982728343","https://openalex.org/W1991727068","https://openalex.org/W1997109056","https://openalex.org/W2016100027","https://openalex.org/W2018384136","https://openalex.org/W2039199275","https://openalex.org/W2066218102","https://openalex.org/W2111732517","https://openalex.org/W2112469598","https://openalex.org/W2118354544","https://openalex.org/W2120608389","https://openalex.org/W2139916917","https://openalex.org/W2141998673","https://openalex.org/W2143027228","https://openalex.org/W2146324387","https://openalex.org/W2147665979","https://openalex.org/W2147817981","https://openalex.org/W2148024641","https://openalex.org/W2158698691","https://openalex.org/W2164082598","https://openalex.org/W2169399159","https://openalex.org/W2336913545","https://openalex.org/W2398042854","https://openalex.org/W2400112243","https://openalex.org/W2408744528","https://openalex.org/W2516001803","https://openalex.org/W2536388235","https://openalex.org/W2559260703","https://openalex.org/W2563666542","https://openalex.org/W2568308529","https://openalex.org/W2586584460","https://openalex.org/W2591810467","https://openalex.org/W2657050993","https://openalex.org/W2702006285","https://openalex.org/W2743121184","https://openalex.org/W2752530932","https://openalex.org/W2791272514","https://openalex.org/W2807518508","https://openalex.org/W2890553422","https://openalex.org/W2900091068","https://openalex.org/W2903058076","https://openalex.org/W2942172990","https://openalex.org/W2945191446","https://openalex.org/W2951183478","https://openalex.org/W2963488660","https://openalex.org/W2964058413","https://openalex.org/W2964121744","https://openalex.org/W2970789614","https://openalex.org/W2972757492","https://openalex.org/W2973918989","https://openalex.org/W6631190155","https://openalex.org/W6767448423"],"related_works":["https://openalex.org/W2120771489","https://openalex.org/W2051376034","https://openalex.org/W2955597484","https://openalex.org/W3110551121","https://openalex.org/W2089240210","https://openalex.org/W2131486661","https://openalex.org/W111365173","https://openalex.org/W2161396743","https://openalex.org/W2386453889","https://openalex.org/W3134790285"],"abstract_inverted_index":{"This":[0,84],"article":[1],"presents":[2],"a":[3,91,101],"recursive":[4],"expectation-maximization":[5],"algorithm":[6,95,123],"for":[7,74,106,158],"online":[8,107],"multichannel":[9,132],"speech":[10,23,39,45,55,60,63,119],"enhancement.":[11],"A":[12],"deep":[13],"neural":[14],"network":[15],"mask":[16],"estimator":[17],"is":[18,27,47,87,124],"used":[19,68],"to":[20,69],"compute":[21,70],"the":[22,37,71,97,131,135],"presence":[24,56,64],"probability,":[25],"which":[26],"then":[28],"improved":[29],"by":[30,78],"means":[31,79],"of":[32,36,80,134],"statistical":[33,103],"spatial":[34,116],"models":[35],"noisy":[38,128],"and":[40,54,62,76,117],"noise":[41,151],"signals.":[42],"The":[43,58,94,138],"clean":[44,59],"signal":[46],"estimated":[48],"using":[49,130],"beamforming,":[50],"single-channel":[51],"linear":[52],"postfiltering":[53,77],"masking.":[57],"statistics":[61],"probabilities":[65],"are":[66],"finally":[67],"acoustic":[72],"parameters":[73],"beamforming":[75],"maximum":[81],"likelihood":[82],"estimation.":[83],"iterative":[85],"procedure":[86],"carried":[88],"out":[89],"on":[90],"frame-by-frame":[92],"basis.":[93],"integrates":[96],"different":[98,127],"estimates":[99],"in":[100,126,150],"common":[102],"framework":[104],"suitable":[105],"scenarios.":[108],"Moreover,":[109],"our":[110,143],"method":[111,144],"can":[112],"successfully":[113],"exploit":[114],"spectral,":[115],"temporal":[118],"properties.":[120],"Our":[121],"proposed":[122],"tested":[125],"environments":[129],"recordings":[133],"CHiME-4":[136],"database.":[137],"experimental":[139],"results":[140],"show":[141],"that":[142],"outperforms":[145],"other":[146],"related":[147],"state-of-the-art":[148],"approaches":[149],"reduction":[152],"performance,":[153],"while":[154],"allowing":[155],"low-latency":[156],"processing":[157],"real-time":[159],"applications.":[160]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
