{"id":"https://openalex.org/W3196940724","doi":"https://doi.org/10.1109/icassp43922.2022.9746432","title":"Embedding and Beamforming: All-Neural Causal Beamformer for Multichannel Speech Enhancement","display_name":"Embedding and Beamforming: All-Neural Causal Beamformer for Multichannel Speech Enhancement","publication_year":2022,"publication_date":"2022-04-27","ids":{"openalex":"https://openalex.org/W3196940724","doi":"https://doi.org/10.1109/icassp43922.2022.9746432","mag":"3196940724"},"language":"en","primary_location":{"id":"doi:10.1109/icassp43922.2022.9746432","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9746432","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053757616","display_name":"Andong Li","orcid":"https://orcid.org/0000-0003-4094-8448"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Andong Li","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","University of Chinese Academy of Sciences, Beijing, China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100679522","display_name":"Wenzhe Liu","orcid":"https://orcid.org/0000-0002-0827-6883"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenzhe Liu","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","University of Chinese Academy of Sciences, Beijing, China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070266277","display_name":"Chengshi Zheng","orcid":"https://orcid.org/0000-0001-5656-994X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengshi Zheng","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100369696","display_name":"Xiaodong Li","orcid":"https://orcid.org/0000-0002-0749-8150"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Li","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053757616"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210099069","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":6.6882,"has_fulltext":false,"cited_by_count":57,"citation_normalized_percentile":{"value":0.97890428,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"6487","last_page":"6491"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.7813418507575989},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7019309997558594},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.6675088405609131},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.600297749042511},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5592736005783081},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5503572225570679},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5083126425743103},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4704025387763977},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.4682297110557556},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4185323715209961},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4166909456253052},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3743818402290344},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.23839795589447021},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.1491760015487671},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.10118156671524048},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.07751700282096863}],"concepts":[{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.7813418507575989},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7019309997558594},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.6675088405609131},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.600297749042511},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5592736005783081},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5503572225570679},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5083126425743103},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4704025387763977},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.4682297110557556},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4185323715209961},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4166909456253052},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3743818402290344},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.23839795589447021},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.1491760015487671},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.10118156671524048},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.07751700282096863},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp43922.2022.9746432","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9746432","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7200000286102295,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W165956390","https://openalex.org/W1522301498","https://openalex.org/W1552314771","https://openalex.org/W1677182931","https://openalex.org/W1974387177","https://openalex.org/W2060108923","https://openalex.org/W2117678320","https://openalex.org/W2289394825","https://openalex.org/W2289480995","https://openalex.org/W2398042854","https://openalex.org/W2398972335","https://openalex.org/W2516001803","https://openalex.org/W2517616541","https://openalex.org/W2567070169","https://openalex.org/W2568308529","https://openalex.org/W2586584460","https://openalex.org/W2592384597","https://openalex.org/W2791568767","https://openalex.org/W2900893004","https://openalex.org/W2963970792","https://openalex.org/W2972802573","https://openalex.org/W2976510122","https://openalex.org/W3004309045","https://openalex.org/W3015312544","https://openalex.org/W3015372568","https://openalex.org/W3016094953","https://openalex.org/W3025800305","https://openalex.org/W3032514799","https://openalex.org/W3120336970","https://openalex.org/W3145364388","https://openalex.org/W3162341667","https://openalex.org/W3162493033","https://openalex.org/W3173999841","https://openalex.org/W3196360884","https://openalex.org/W3197260772","https://openalex.org/W3198511309","https://openalex.org/W3213188934","https://openalex.org/W6606758639","https://openalex.org/W6631190155","https://openalex.org/W6633117090","https://openalex.org/W6731370813","https://openalex.org/W6780226713"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W2761785940","https://openalex.org/W2110523656","https://openalex.org/W1482209366","https://openalex.org/W2521627374"],"abstract_inverted_index":{"Standing":[0],"upon":[1],"the":[2,42,49,52,69,81,92,97,102,109,113],"intersection":[3],"of":[4,36,126],"traditional":[5],"beamformers":[6],"and":[7,20,22,31,108],"deep":[8],"neural":[9,15],"networks,":[10],"we":[11,100],"propose":[12],"a":[13,62,84,121],"causal":[14],"beamformer":[16],"paradigm":[17],"called":[18],"Embedding":[19],"Beamforming,":[21],"two":[23],"core":[24],"modules":[25],"are":[26],"devised":[27],"accordingly,":[28],"namely":[29],"EM":[30],"BM.":[32],"For":[33,60],"EM,":[34],"instead":[35],"estimating":[37],"spatial":[38],"covariance":[39],"matrix":[40],"explicitly,":[41],"3-D":[43],"embedding":[44],"tensor":[45],"is":[46,64,87],"learned":[47],"with":[48],"network,":[50],"where":[51],"spatial-spectral":[53],"discriminative":[54],"information":[55],"can":[56],"be":[57],"implicitly":[58],"represented.":[59],"BM,":[61],"network":[63],"directly":[65],"leveraged":[66],"to":[67,74,89],"derive":[68],"beamforming":[70],"weights":[71],"so":[72],"as":[73],"implement":[75],"filter-and-sum":[76],"operation.":[77],"To":[78],"further":[79,90],"improve":[80],"speech":[82,106],"quality,":[83],"post-processing":[85],"module":[86],"introduced":[88],"suppress":[91],"residual":[93],"noise.":[94],"Based":[95],"on":[96],"DNS-Challenge":[98],"dataset,":[99],"conduct":[101],"experiments":[103],"for":[104],"multichannel":[105],"enhancement":[107],"results":[110],"show":[111],"that":[112],"proposed":[114],"system":[115],"outperforms":[116],"previous":[117],"advanced":[118],"baselines":[119],"by":[120],"large":[122],"margin":[123],"in":[124],"terms":[125],"multiple":[127],"evaluation":[128],"metrics.":[129]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":16},{"year":2024,"cited_by_count":17},{"year":2023,"cited_by_count":20},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
