{"id":"https://openalex.org/W1926194041","doi":"https://doi.org/10.1186/s13634-015-0259-1","title":"Feature enhancement of reverberant speech by distribution matching and non-negative matrix factorization","display_name":"Feature enhancement of reverberant speech by distribution matching and non-negative matrix factorization","publication_year":2015,"publication_date":"2015-08-19","ids":{"openalex":"https://openalex.org/W1926194041","doi":"https://doi.org/10.1186/s13634-015-0259-1","mag":"1926194041"},"language":"en","primary_location":{"id":"doi:10.1186/s13634-015-0259-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13634-015-0259-1","pdf_url":"https://asp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13634-015-0259-1","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13634-015-0259-1","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056123362","display_name":"Sami Keronen","orcid":null},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":true,"raw_author_name":"Sami Keronen","raw_affiliation_strings":["Department of Signal Processing and Acoustics, Aalto university, P.O. Box 13000, Aalto, 00076, Finland","[Dept. of Signal Processing and Acoustics, Aalto University, Aalto, Finland]"],"affiliations":[{"raw_affiliation_string":"Department of Signal Processing and Acoustics, Aalto university, P.O. Box 13000, Aalto, 00076, Finland","institution_ids":["https://openalex.org/I9927081"]},{"raw_affiliation_string":"[Dept. of Signal Processing and Acoustics, Aalto University, Aalto, Finland]","institution_ids":["https://openalex.org/I9927081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091409087","display_name":"Heikki Kallasjoki","orcid":null},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Heikki Kallasjoki","raw_affiliation_strings":["Department of Signal Processing and Acoustics, Aalto university, P.O. Box 13000, Aalto, 00076, Finland","[Dept. of Signal Processing and Acoustics, Aalto University, Aalto, Finland]"],"affiliations":[{"raw_affiliation_string":"Department of Signal Processing and Acoustics, Aalto university, P.O. Box 13000, Aalto, 00076, Finland","institution_ids":["https://openalex.org/I9927081"]},{"raw_affiliation_string":"[Dept. of Signal Processing and Acoustics, Aalto University, Aalto, Finland]","institution_ids":["https://openalex.org/I9927081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053741868","display_name":"Kalle Palom\u00e4ki","orcid":null},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Kalle J. Palom\u00e4ki","raw_affiliation_strings":["Department of Signal Processing and Acoustics, Aalto university, P.O. Box 13000, Aalto, 00076, Finland","[Dept. of Signal Processing and Acoustics, Aalto University, Aalto, Finland]"],"affiliations":[{"raw_affiliation_string":"Department of Signal Processing and Acoustics, Aalto university, P.O. Box 13000, Aalto, 00076, Finland","institution_ids":["https://openalex.org/I9927081"]},{"raw_affiliation_string":"[Dept. of Signal Processing and Acoustics, Aalto University, Aalto, Finland]","institution_ids":["https://openalex.org/I9927081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080527909","display_name":"Guy J. Brown","orcid":"https://orcid.org/0000-0001-8565-5476"},"institutions":[{"id":"https://openalex.org/I91136226","display_name":"University of Sheffield","ror":"https://ror.org/05krs5044","country_code":"GB","type":"education","lineage":["https://openalex.org/I91136226"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Guy J. Brown","raw_affiliation_strings":["Department of Computer Science, University of Sheffield, Regent Court, 211 Portobello, Sheffield, S1 4DP, UK","Department of Computer Science, University of Sheffield, Sheffield, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Sheffield, Regent Court, 211 Portobello, Sheffield, S1 4DP, UK","institution_ids":["https://openalex.org/I91136226"]},{"raw_affiliation_string":"Department of Computer Science, University of Sheffield, Sheffield, UK","institution_ids":["https://openalex.org/I91136226"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109012430","display_name":"Jort F. Gemmeke","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118287","display_name":"AuSIM (United States)","ror":"https://ror.org/02hd3s336","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118287"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jort F. Gemmeke","raw_affiliation_strings":["Audience, Inc., Mountain View, 94043, CA, USA","Audience, Inc., Mountain View, USA"],"affiliations":[{"raw_affiliation_string":"Audience, Inc., Mountain View, 94043, CA, USA","institution_ids":["https://openalex.org/I4210118287"]},{"raw_affiliation_string":"Audience, Inc., Mountain View, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5056123362"],"corresponding_institution_ids":["https://openalex.org/I9927081"],"apc_list":{"value":1140,"currency":"GBP","value_usd":1398},"apc_paid":{"value":1140,"currency":"GBP","value_usd":1398},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05819649,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"2015","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7732052803039551},{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.7051552534103394},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6698519587516785},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5730569362640381},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5445300936698914},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5215066075325012},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5067854523658752},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4996821880340576},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.4642539620399475},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.45671382546424866},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4535861313343048},{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.4507286250591278},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.1718473732471466},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.1133926510810852}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7732052803039551},{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.7051552534103394},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6698519587516785},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5730569362640381},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5445300936698914},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5215066075325012},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5067854523658752},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4996821880340576},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4642539620399475},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.45671382546424866},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4535861313343048},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.4507286250591278},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.1718473732471466},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.1133926510810852},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s13634-015-0259-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13634-015-0259-1","pdf_url":"https://asp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13634-015-0259-1","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/26483","is_oa":true,"landing_page_url":"https://research.aalto.fi/en/publications/08d9bec4-625b-43d4-ad59-71b82394e215","pdf_url":null,"source":{"id":"https://openalex.org/S4306401663","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"publishedVersion"}],"best_oa_location":{"id":"doi:10.1186/s13634-015-0259-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13634-015-0259-1","pdf_url":"https://asp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13634-015-0259-1","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.7699999809265137}],"awards":[{"id":"https://openalex.org/G2552001108","display_name":null,"funder_award_id":"ICT-618075","funder_id":"https://openalex.org/F4320321108","funder_display_name":"Academy of Finland"},{"id":"https://openalex.org/G4249896723","display_name":null,"funder_award_id":"251170","funder_id":"https://openalex.org/F4320321108","funder_display_name":"Academy of Finland"},{"id":"https://openalex.org/G7328963496","display_name":null,"funder_award_id":"136209","funder_id":"https://openalex.org/F4320321108","funder_display_name":"Academy of Finland"}],"funders":[{"id":"https://openalex.org/F4320321108","display_name":"Academy of Finland","ror":"https://ror.org/05k73zm37"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1926194041.pdf","grobid_xml":"https://content.openalex.org/works/W1926194041.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W54525843","https://openalex.org/W1606794504","https://openalex.org/W1989314204","https://openalex.org/W1992272902","https://openalex.org/W1993721840","https://openalex.org/W2026369565","https://openalex.org/W2046317813","https://openalex.org/W2058333183","https://openalex.org/W2086322880","https://openalex.org/W2104298926","https://openalex.org/W2106582496","https://openalex.org/W2113932204","https://openalex.org/W2114016253","https://openalex.org/W2122562222","https://openalex.org/W2125234026","https://openalex.org/W2125436743","https://openalex.org/W2130283666","https://openalex.org/W2130722890","https://openalex.org/W2131118158","https://openalex.org/W2135029798","https://openalex.org/W2138370890","https://openalex.org/W2141520175","https://openalex.org/W2145692202","https://openalex.org/W2147166770","https://openalex.org/W2148898720","https://openalex.org/W2150415460","https://openalex.org/W2158291955","https://openalex.org/W2160815625","https://openalex.org/W2183622110","https://openalex.org/W2184045248","https://openalex.org/W2397819789","https://openalex.org/W2403608536","https://openalex.org/W2726348732","https://openalex.org/W2759056399","https://openalex.org/W2762693443","https://openalex.org/W3143596294"],"related_works":["https://openalex.org/W2104780554","https://openalex.org/W2145692202","https://openalex.org/W2156393451","https://openalex.org/W2076893062","https://openalex.org/W2405184167","https://openalex.org/W1954839664","https://openalex.org/W2482610912","https://openalex.org/W2407147558","https://openalex.org/W2998100475","https://openalex.org/W2539994084"],"abstract_inverted_index":{"This":[0],"paper":[1],"describes":[2],"a":[3,42,48,72,80],"novel":[4],"two-stage":[5],"dereverberation":[6],"feature":[7,97],"enhancement":[8,98],"method":[9],"for":[10],"noise-robust":[11],"automatic":[12,105],"speech":[13,24,35,86,106],"recognition.":[14],"In":[15],"the":[16,22,29,32,56,84,92,114],"first":[17],"stage,":[18],"an":[19,68,89],"estimate":[20,70,90],"of":[21,31,38,58,83,91],"dereverberated":[23,65],"is":[25,110],"generated":[26],"by":[27],"matching":[28],"distribution":[30],"observed":[33],"reverberant":[34],"to":[36,54,112,118],"that":[37,46],"clean":[39,85],"speech,":[40],"in":[41,52,102],"decorrelated":[43],"transformation":[44],"domain":[45],"has":[47],"long":[49],"temporal":[50],"context":[51],"order":[53],"address":[55],"effects":[57],"reverberation.":[59],"The":[60,95],"second":[61],"stage":[62],"uses":[63],"this":[64],"signal":[66,87],"as":[67],"initial":[69],"within":[71],"non-negative":[73],"matrix":[74],"factorization":[75],"framework,":[76],"which":[77],"jointly":[78],"estimates":[79],"sparse":[81],"representation":[82],"and":[88],"convolutional":[93],"distortion.":[94],"proposed":[96],"method,":[99],"when":[100],"used":[101],"conjunction":[103],"with":[104],"recognizer":[107],"back-end":[108],"processing,":[109],"shown":[111],"improve":[113],"recognition":[115],"performance":[116],"compared":[117],"three":[119],"other":[120],"state-of-the-art":[121],"techniques.":[122]},"counts_by_year":[],"updated_date":"2026-03-29T08:15:47.926485","created_date":"2025-10-10T00:00:00"}
