{"id":"https://openalex.org/W2180972031","doi":"https://doi.org/10.1186/s13634-015-0278-y","title":"Environment-dependent denoising autoencoder for distant-talking speech recognition","display_name":"Environment-dependent denoising autoencoder for distant-talking speech recognition","publication_year":2015,"publication_date":"2015-11-12","ids":{"openalex":"https://openalex.org/W2180972031","doi":"https://doi.org/10.1186/s13634-015-0278-y","mag":"2180972031"},"language":"en","primary_location":{"id":"doi:10.1186/s13634-015-0278-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13634-015-0278-y","pdf_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13634-015-0278-y","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13634-015-0278-y","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100901893","display_name":"Yuma Ueda","orcid":null},"institutions":[{"id":"https://openalex.org/I1298590031","display_name":"Shizuoka University","ror":"https://ror.org/01w6wtk13","country_code":"JP","type":"education","lineage":["https://openalex.org/I1298590031"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yuma Ueda","raw_affiliation_strings":["Graduate School of Engineering, Shizuoka University, Johoku Naka-ku, Hamamatsu, 432-8561, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, Shizuoka University, Johoku Naka-ku, Hamamatsu, 432-8561, Japan","institution_ids":["https://openalex.org/I1298590031"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101745213","display_name":"Longbiao Wang","orcid":"https://orcid.org/0000-0002-8094-6861"},"institutions":[{"id":"https://openalex.org/I85922643","display_name":"Nagaoka University of Technology","ror":"https://ror.org/00ys1hz88","country_code":"JP","type":"education","lineage":["https://openalex.org/I85922643"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Longbiao Wang","raw_affiliation_strings":["Nagaoka University of Technology, 1603-1 Kamitomioka, Nagaoka, 940-2188, Japan"],"affiliations":[{"raw_affiliation_string":"Nagaoka University of Technology, 1603-1 Kamitomioka, Nagaoka, 940-2188, Japan","institution_ids":["https://openalex.org/I85922643"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071123569","display_name":"Atsuhiko Kai","orcid":null},"institutions":[{"id":"https://openalex.org/I1298590031","display_name":"Shizuoka University","ror":"https://ror.org/01w6wtk13","country_code":"JP","type":"education","lineage":["https://openalex.org/I1298590031"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Atsuhiko Kai","raw_affiliation_strings":["Graduate School of Engineering, Shizuoka University, Johoku Naka-ku, Hamamatsu, 432-8561, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, Shizuoka University, Johoku Naka-ku, Hamamatsu, 432-8561, Japan","institution_ids":["https://openalex.org/I1298590031"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041413561","display_name":"Bo Ren","orcid":"https://orcid.org/0000-0002-0481-5069"},"institutions":[{"id":"https://openalex.org/I85922643","display_name":"Nagaoka University of Technology","ror":"https://ror.org/00ys1hz88","country_code":"JP","type":"education","lineage":["https://openalex.org/I85922643"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Bo Ren","raw_affiliation_strings":["Nagaoka University of Technology, 1603-1 Kamitomioka, Nagaoka, 940-2188, Japan"],"affiliations":[{"raw_affiliation_string":"Nagaoka University of Technology, 1603-1 Kamitomioka, Nagaoka, 940-2188, Japan","institution_ids":["https://openalex.org/I85922643"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100901893"],"corresponding_institution_ids":["https://openalex.org/I1298590031"],"apc_list":{"value":1140,"currency":"GBP","value_usd":1398},"apc_paid":{"value":1140,"currency":"GBP","value_usd":1398},"fwci":2.6057,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.90637199,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"2015","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.8870388269424438},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7520952224731445},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.714292049407959},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6389050483703613},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5443766117095947},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.49434590339660645},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.4855446517467499},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4815123975276947},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4814388155937195},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47367578744888306},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39736413955688477},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.3810465931892395},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35345304012298584},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.21298813819885254},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12006932497024536}],"concepts":[{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.8870388269424438},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7520952224731445},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.714292049407959},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6389050483703613},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5443766117095947},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.49434590339660645},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.4855446517467499},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4815123975276947},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4814388155937195},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47367578744888306},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39736413955688477},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.3810465931892395},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35345304012298584},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.21298813819885254},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12006932497024536},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1186/s13634-015-0278-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13634-015-0278-y","pdf_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13634-015-0278-y","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1186/s13634-015-0278-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13634-015-0278-y","pdf_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13634-015-0278-y","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3311735153","display_name":"\u8b58\u5225\u7684\u7279\u5fb4\u62bd\u51fa\u3068\u78ba\u7387\u30e2\u30c7\u30eb\u306b\u57fa\u3065\u304f\u591a\u69d8\u306a\u74b0\u5883\u30fb\u767a\u58f0\u5909\u52d5\u306b\u9811\u5065\u306a\u97f3\u58f0\u8a8d\u8b58","funder_award_id":"15K16020","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5786340949","display_name":null,"funder_award_id":"KAKENHI Grant Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8716678415","display_name":"\u540c\u548c\u6559\u80b2\u306b\u304a\u3051\u308b\u9032\u8def\u6307\u5c0e\u306e\u5b9f\u8df5\u7684\u7814\u7a76","funder_award_id":"16020","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320315567","display_name":"Kayamori Foundation of Informational Science","ror":null},{"id":"https://openalex.org/F4320315724","display_name":"Kayamori Foundation of Informational Science Advancement","ror":null},{"id":"https://openalex.org/F4320325763","display_name":"Telecommunications Advancement Foundation","ror":"https://ror.org/05y77zf79"},{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2180972031.pdf","grobid_xml":"https://content.openalex.org/works/W2180972031.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W177307080","https://openalex.org/W1499999342","https://openalex.org/W1524333225","https://openalex.org/W1544785557","https://openalex.org/W1583048384","https://openalex.org/W1973669708","https://openalex.org/W1973681148","https://openalex.org/W1981706894","https://openalex.org/W1982846521","https://openalex.org/W1985242443","https://openalex.org/W1989314204","https://openalex.org/W1998229164","https://openalex.org/W2009106392","https://openalex.org/W2026136559","https://openalex.org/W2042071805","https://openalex.org/W2047769394","https://openalex.org/W2053150333","https://openalex.org/W2062164080","https://openalex.org/W2069976350","https://openalex.org/W2078528584","https://openalex.org/W2079623482","https://openalex.org/W2091828388","https://openalex.org/W2100495367","https://openalex.org/W2103564015","https://openalex.org/W2110322414","https://openalex.org/W2112748425","https://openalex.org/W2114782757","https://openalex.org/W2128653836","https://openalex.org/W2130722890","https://openalex.org/W2132054610","https://openalex.org/W2132214945","https://openalex.org/W2142117481","https://openalex.org/W2145094598","https://openalex.org/W2147166770","https://openalex.org/W2148898720","https://openalex.org/W2151435578","https://openalex.org/W2165548826","https://openalex.org/W2219673179","https://openalex.org/W2296581541","https://openalex.org/W2394498270","https://openalex.org/W2405774341","https://openalex.org/W2762693443","https://openalex.org/W3145668479","https://openalex.org/W6600280466","https://openalex.org/W6600567258","https://openalex.org/W6836791025"],"related_works":["https://openalex.org/W2159052453","https://openalex.org/W3013693939","https://openalex.org/W2566616303","https://openalex.org/W3131327266","https://openalex.org/W4297051394","https://openalex.org/W2752972570","https://openalex.org/W2734887215","https://openalex.org/W2803255133","https://openalex.org/W2909431601","https://openalex.org/W3037110488"],"abstract_inverted_index":{"In":[0,72,117,169],"this":[1],"paper,":[2],"we":[3,101,121,157,173],"propose":[4,102,158],"an":[5,93],"environment-dependent":[6,104,150,188,212,227,266,272],"denoising":[7],"autoencoder":[8],"(DAE)":[9],"and":[10,42,49,69,84,114,131,166,203,221,257],"automatic":[11],"environment":[12,154,232],"identification":[13,155,233],"based":[14,234],"on":[15,235],"a":[16,61,73,148,159,186,191],"deep":[17],"neural":[18],"network":[19],"(DNN)":[20],"with":[21],"blind":[22],"reverberation":[23,43,176,258],"estimation":[24],"for":[25,134],"robust":[26],"distant-talking":[27],"speech":[28,83,86,126,165,200,254],"recognition.":[29],"Recently,":[30],"DAEs":[31,105,124],"have":[32],"been":[33],"shown":[34],"to":[35,106,178],"be":[36,58],"effective":[37],"in":[38,66,201,218,250],"many":[39],"noise":[40],"reduction":[41],"suppression":[44],"applications":[45],"because":[46],"higher-level":[47],"representations":[48],"increased":[50],"flexibility":[51],"of":[52,81,110,181,231,245],"the":[53,98,108,118,132,135,140,170,179,182,211,215,229,236,246,264,270],"feature":[54],"mapping":[55],"function":[56],"can":[57],"learned.":[59],"However,":[60],"DAE":[62,133,183,189,213,267],"is":[63,143,197,240,255,259],"not":[64,260],"adequate":[65],"mismatched":[67],"training":[68,113],"test":[70,115,141],"environments.":[71,116,206,224],"conventional":[74,247],"DAE,":[75,228],"parameters":[76],"are":[77],"trained":[78],"using":[79,125,199],"pairs":[80],"reverberant":[82,164,205,223,253],"clean":[85],"under":[87],"various":[88,123],"acoustic":[89,129],"conditions":[90],"(that":[91,146,184],"is,":[92,147,185],"environment-independent":[94,216],"DAE).":[95,151,193],"To":[96,152],"address":[97],"above":[99],"problem,":[100],"two":[103],"reduce":[107],"influence":[109],"mismatches":[111],"between":[112],"first":[119],"approach,":[120,172,249],"train":[122],"from":[127],"different":[128],"environments,":[130],"condition":[136,142],"that":[137,161,210,244],"best":[138],"matches":[139],"automatically":[144],"selected":[145],"two-step":[149,226,271],"improve":[153],"performance,":[156],"DNN":[160,238,248],"uses":[162],"both":[163,219],"estimated":[167,175],"reverberation.":[168],"second":[171],"add":[174],"features":[177],"input":[180],"one-step":[187,265],"or":[190],"reverberation-aware":[192],"The":[194],"proposed":[195,237],"method":[196],"evaluated":[198],"simulated":[202,220],"real":[204,222],"Experimental":[207],"results":[208],"show":[209],"outperforms":[214,269],"one":[217],"For":[225],"performance":[230],"approach":[239],"also":[241],"better":[242],"than":[243],"which":[251],"only":[252],"used":[256],"blindly":[261],"estimated.":[262],"And,":[263],"significantly":[268],"DAE.":[273]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
