{"id":"https://openalex.org/W2889224938","doi":"https://doi.org/10.21437/interspeech.2018-2196","title":"Integrating Neural Network Based Beamforming and Weighted Prediction Error Dereverberation","display_name":"Integrating Neural Network Based Beamforming and Weighted Prediction Error Dereverberation","publication_year":2018,"publication_date":"2018-08-28","ids":{"openalex":"https://openalex.org/W2889224938","doi":"https://doi.org/10.21437/interspeech.2018-2196","mag":"2889224938"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2018-2196","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2018-2196","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2018","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011191228","display_name":"Lukas Drude","orcid":"https://orcid.org/0000-0003-3683-5432"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lukas Drude","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064522438","display_name":"Christoph Boeddeker","orcid":"https://orcid.org/0000-0002-8701-1567"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Christoph Boeddeker","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006131416","display_name":"Jahn Heymann","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jahn Heymann","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082075598","display_name":"Reinhold Haeb\u2010Umbach","orcid":"https://orcid.org/0000-0001-9468-7330"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reinhold Haeb-Umbach","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069398831","display_name":"Keisuke Kinoshita","orcid":"https://orcid.org/0009-0008-7987-8188"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Keisuke Kinoshita","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023868166","display_name":"Marc Delcroix","orcid":"https://orcid.org/0000-0002-5175-7834"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marc Delcroix","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5021240106","display_name":"Tomohiro Nakatani","orcid":"https://orcid.org/0000-0002-7487-7150"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tomohiro Nakatani","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5011191228"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.4589,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.95557913,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3043","last_page":"3047"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10822","display_name":"Acoustic Wave Phenomena Research","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.7394979000091553},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6954284906387329},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5973769426345825},{"id":"https://openalex.org/keywords/mean-squared-prediction-error","display_name":"Mean squared prediction error","score":0.5830076932907104},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.44224148988723755},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37911301851272583},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3040471374988556},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.1482553780078888}],"concepts":[{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.7394979000091553},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6954284906387329},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5973769426345825},{"id":"https://openalex.org/C167085575","wikidata":"https://www.wikidata.org/wiki/Q6803654","display_name":"Mean squared prediction error","level":2,"score":0.5830076932907104},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.44224148988723755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37911301851272583},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3040471374988556},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.1482553780078888}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2018-2196","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2018-2196","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2018","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1902027874","https://openalex.org/W1935589317","https://openalex.org/W1983812858","https://openalex.org/W1989314204","https://openalex.org/W2003203076","https://openalex.org/W2025768430","https://openalex.org/W2130722890","https://openalex.org/W2140571699","https://openalex.org/W2147166770","https://openalex.org/W2158143227","https://openalex.org/W2164502538","https://openalex.org/W2176412452","https://openalex.org/W2290318471","https://openalex.org/W2591355762","https://openalex.org/W2678124624","https://openalex.org/W2748661748","https://openalex.org/W2966212213","https://openalex.org/W4302156456"],"related_works":["https://openalex.org/W2963170046","https://openalex.org/W2376244802","https://openalex.org/W4311414679","https://openalex.org/W2923631784","https://openalex.org/W818226659","https://openalex.org/W2158075901","https://openalex.org/W2567141277","https://openalex.org/W2130785056","https://openalex.org/W2727286692","https://openalex.org/W2367528705"],"abstract_inverted_index":{"The":[0],"weighted":[1],"prediction":[2],"error":[3,114],"(WPE)":[4],"algorithm":[5],"has":[6,42],"proven":[7],"to":[8,52,60,96,156],"be":[9,50],"a":[10,62,65,78,111,134,170],"very":[11,28],"successful":[12],"dereverberation":[13,54,136],"method":[14],"for":[15,25],"the":[16,33,81,151,158],"REVERB":[17],"challenge.":[18],"Likewise,":[19],"neural":[20,66,99,171],"network":[21,100],"based":[22,101,130],"mask":[23],"estimation":[24],"beamforming":[26,102,131,149],"demonstrated":[27],"good":[29],"noise":[30,162],"suppression":[31],"in":[32,154],"CHiME":[34,37],"3":[35],"and":[36,55,68,92,140,161,169],"4":[38],"challenges.":[39],"Recently,":[40],"it":[41],"been":[43],"shown":[44],"that":[45,127],"this":[46],"estimator":[47],"can":[48],"also":[49],"trained":[51],"perform":[53],"denoising":[56],"jointly.":[57],"However,":[58],"up":[59],"now":[61],"comparison":[63,155],"of":[64,80,90,167],"beamformer":[67,172],"WPE":[69,157,168],"is":[70,74],"still":[71],"missing,":[72],"so":[73],"an":[75,87],"investigation":[76],"into":[77],"combination":[79],"two.":[82],"Therefore,":[83],"we":[84,109],"here":[85],"provide":[86],"extensive":[88],"evaluation":[89],"both":[91],"consequently":[93],"propose":[94],"variants":[95,108],"integrate":[97],"deep":[98,128],"with":[103],"WPE.":[104],"For":[105],"these":[106],"integrated":[107],"identify":[110],"consistent":[112],"word":[113],"rate":[115],"(WER)":[116],"reduction":[117],"on":[118],"two":[119],"distinct":[120],"databases.":[121],"In":[122],"particular,":[123],"our":[124],"study":[125],"shows":[126],"learning":[129],"benefits":[132],"from":[133],"model-based":[135],"technique":[137],"(i.e.":[138],"WPE)":[139],"vice":[141],"versa.":[142],"Our":[143],"key":[144],"findings":[145],"are:":[146],"(a)":[147],"Neural":[148],"yields":[150],"lower":[152],"WERs":[153],"more":[159],"channels":[160],"are":[163],"present.":[164],"(b)":[165],"Integration":[166],"consistently":[173],"outperforms":[174],"all":[175],"stand-alone":[176],"systems.":[177]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":12},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
