{"id":"https://openalex.org/W4316813147","doi":"https://doi.org/10.3390/sym15020261","title":"A Pre-Separation and All-Neural Beamformer Framework for Multi-Channel Speech Separation","display_name":"A Pre-Separation and All-Neural Beamformer Framework for Multi-Channel Speech Separation","publication_year":2023,"publication_date":"2023-01-17","ids":{"openalex":"https://openalex.org/W4316813147","doi":"https://doi.org/10.3390/sym15020261"},"language":"en","primary_location":{"id":"doi:10.3390/sym15020261","is_oa":true,"landing_page_url":"https://doi.org/10.3390/sym15020261","pdf_url":"https://www.mdpi.com/2073-8994/15/2/261/pdf?version=1673951335","source":{"id":"https://openalex.org/S190787756","display_name":"Symmetry","issn_l":"2073-8994","issn":["2073-8994"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Symmetry","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2073-8994/15/2/261/pdf?version=1673951335","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022198380","display_name":"Wupeng Xie","orcid":"https://orcid.org/0000-0002-4319-9326"},"institutions":[{"id":"https://openalex.org/I2800372957","display_name":"China Electronics Technology Group Corporation","ror":"https://ror.org/0098hst83","country_code":"CN","type":"company","lineage":["https://openalex.org/I2800372957"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wupeng Xie","raw_affiliation_strings":["Information Science Academy, China Electronics Technology Group Corporation, Beijing 100041, China"],"affiliations":[{"raw_affiliation_string":"Information Science Academy, China Electronics Technology Group Corporation, Beijing 100041, China","institution_ids":["https://openalex.org/I2800372957"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007226235","display_name":"Xiaoxiao Xiang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoxiao Xiang","raw_affiliation_strings":["Aerospace Information Research Institute, Chinese Academy of Sciences, Beijing 100190, China","Key Laboratory of Electromagnetic Radiation and Sensing Technology, Chinese Academy of Sciences, Beijing 100190, China","School of Electronic, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing 100049, China"],"affiliations":[{"raw_affiliation_string":"Aerospace Information Research Institute, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210137199","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Electromagnetic Radiation and Sensing Technology, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Electronic, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing 100049, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100457255","display_name":"Xiaojuan Zhang","orcid":"https://orcid.org/0000-0002-1543-0025"},"institutions":[{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojuan Zhang","raw_affiliation_strings":["Aerospace Information Research Institute, Chinese Academy of Sciences, Beijing 100190, China","Key Laboratory of Electromagnetic Radiation and Sensing Technology, Chinese Academy of Sciences, Beijing 100190, China"],"affiliations":[{"raw_affiliation_string":"Aerospace Information Research Institute, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210137199","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Electromagnetic Radiation and Sensing Technology, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071330051","display_name":"Guanghong Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I2800372957","display_name":"China Electronics Technology Group Corporation","ror":"https://ror.org/0098hst83","country_code":"CN","type":"company","lineage":["https://openalex.org/I2800372957"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanghong Liu","raw_affiliation_strings":["Information Science Academy, China Electronics Technology Group Corporation, Beijing 100041, China"],"affiliations":[{"raw_affiliation_string":"Information Science Academy, China Electronics Technology Group Corporation, Beijing 100041, China","institution_ids":["https://openalex.org/I2800372957"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5022198380"],"corresponding_institution_ids":["https://openalex.org/I2800372957"],"apc_list":{"value":2000,"currency":"CHF","value_usd":2165},"apc_paid":{"value":2000,"currency":"CHF","value_usd":2165},"fwci":0.61,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.61914001,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"15","issue":"2","first_page":"261","last_page":"261"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.7607560157775879},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.737448513507843},{"id":"https://openalex.org/keywords/microphone-array","display_name":"Microphone array","score":0.6458752155303955},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.6234185099601746},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5621917247772217},{"id":"https://openalex.org/keywords/adaptive-beamformer","display_name":"Adaptive beamformer","score":0.5501337051391602},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5092869997024536},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.5071172714233398},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.48430028557777405},{"id":"https://openalex.org/keywords/minimum-variance-unbiased-estimator","display_name":"Minimum-variance unbiased estimator","score":0.4810919463634491},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.46971574425697327},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.46393898129463196},{"id":"https://openalex.org/keywords/separation-method","display_name":"Separation method","score":0.4433770477771759},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25130248069763184},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17228659987449646},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.12264800071716309},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.10489481687545776},{"id":"https://openalex.org/keywords/mean-squared-error","display_name":"Mean squared error","score":0.07590034604072571}],"concepts":[{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.7607560157775879},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.737448513507843},{"id":"https://openalex.org/C2778806681","wikidata":"https://www.wikidata.org/wiki/Q907293","display_name":"Microphone array","level":4,"score":0.6458752155303955},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.6234185099601746},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5621917247772217},{"id":"https://openalex.org/C33378366","wikidata":"https://www.wikidata.org/wiki/Q4680719","display_name":"Adaptive beamformer","level":3,"score":0.5501337051391602},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5092869997024536},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.5071172714233398},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.48430028557777405},{"id":"https://openalex.org/C165646398","wikidata":"https://www.wikidata.org/wiki/Q3755281","display_name":"Minimum-variance unbiased estimator","level":3,"score":0.4810919463634491},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.46971574425697327},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.46393898129463196},{"id":"https://openalex.org/C3018256011","wikidata":"https://www.wikidata.org/wiki/Q898987","display_name":"Separation method","level":2,"score":0.4433770477771759},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25130248069763184},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17228659987449646},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.12264800071716309},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.10489481687545776},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.07590034604072571},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/sym15020261","is_oa":true,"landing_page_url":"https://doi.org/10.3390/sym15020261","pdf_url":"https://www.mdpi.com/2073-8994/15/2/261/pdf?version=1673951335","source":{"id":"https://openalex.org/S190787756","display_name":"Symmetry","issn_l":"2073-8994","issn":["2073-8994"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Symmetry","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:2fbc0031349849bdbe8630925c3734f7","is_oa":true,"landing_page_url":"https://doaj.org/article/2fbc0031349849bdbe8630925c3734f7","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Symmetry, Vol 15, Iss 2, p 261 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2073-8994/15/2/261/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/sym15020261","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Symmetry","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/sym15020261","is_oa":true,"landing_page_url":"https://doi.org/10.3390/sym15020261","pdf_url":"https://www.mdpi.com/2073-8994/15/2/261/pdf?version=1673951335","source":{"id":"https://openalex.org/S190787756","display_name":"Symmetry","issn_l":"2073-8994","issn":["2073-8994"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Symmetry","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.6600000262260437}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4316813147.pdf"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1552314771","https://openalex.org/W1677182931","https://openalex.org/W1974387177","https://openalex.org/W2069681747","https://openalex.org/W2119438736","https://openalex.org/W2141998673","https://openalex.org/W2147665979","https://openalex.org/W2517616541","https://openalex.org/W2714487941","https://openalex.org/W2734774145","https://openalex.org/W2900893004","https://openalex.org/W2952218014","https://openalex.org/W2963177459","https://openalex.org/W2972460025","https://openalex.org/W2973231102","https://openalex.org/W2991361823","https://openalex.org/W3004309045","https://openalex.org/W3015372568","https://openalex.org/W3015679215","https://openalex.org/W3016094953","https://openalex.org/W3016257794","https://openalex.org/W3032514799","https://openalex.org/W3041647828","https://openalex.org/W3097906045","https://openalex.org/W3099330747","https://openalex.org/W3110852964","https://openalex.org/W3134695619","https://openalex.org/W3162341667","https://openalex.org/W3162493033","https://openalex.org/W3162539493","https://openalex.org/W3165227983","https://openalex.org/W3171278394","https://openalex.org/W3175083350","https://openalex.org/W3196360884","https://openalex.org/W3196940724","https://openalex.org/W3205004157","https://openalex.org/W3212231398","https://openalex.org/W4210402803","https://openalex.org/W4285170242","https://openalex.org/W4295308648","https://openalex.org/W6631190155"],"related_works":["https://openalex.org/W2392382502","https://openalex.org/W1589665459","https://openalex.org/W4205442640","https://openalex.org/W1982764159","https://openalex.org/W2393615245","https://openalex.org/W2348931051","https://openalex.org/W2168445433","https://openalex.org/W1999288241","https://openalex.org/W3133250934","https://openalex.org/W2015868395"],"abstract_inverted_index":{"Thanks":[0],"to":[1,88,103],"the":[2,51,54,59,68,75,79,99,110,118,133],"use":[3],"of":[4,53,117],"deep":[5],"neural":[6,21],"networks":[7],"(DNNs),":[8],"microphone":[9],"array":[10],"speech":[11,47,91,120,124],"separation":[12,48,121,129],"methods":[13,23],"have":[14],"achieved":[15],"impressive":[16],"performance.":[17,33],"However,":[18],"most":[19],"existing":[20],"beamforming":[22,81,101,106],"explicitly":[24],"follow":[25],"traditional":[26],"beamformer":[27,41],"formulas,":[28],"which":[29,94],"possibly":[30],"causes":[31],"sub-optimal":[32],"In":[34],"this":[35,144],"study,":[36],"a":[37],"pre-separation":[38,76,84],"and":[39,78,92,127],"all-neural":[40,80,100],"framework":[42,70],"is":[43,86,136],"proposed":[44,69,134],"for":[45,149],"multi-channel":[46,119],"without":[49,108],"following":[50],"solutions":[52],"conventional":[55],"beamformers,":[56],"such":[57],"as":[58],"minimum":[60],"variance":[61],"distortionless":[62],"response":[63],"(MVDR)":[64],"beamformer.":[65],"More":[66],"specifically,":[67],"includes":[71],"two":[72],"modules,":[73],"namely":[74],"module":[77,85,102],"module.":[82],"The":[83,114],"used":[87,148],"obtain":[89,104],"pre-separated":[90],"interference,":[93],"are":[95],"further":[96],"utilized":[97],"by":[98],"frame-level":[105],"weights":[107],"computing":[109],"spatial":[111],"covariance":[112],"matrices.":[113],"evaluation":[115],"results":[116],"tasks,":[122],"including":[123],"enhancement":[125],"subtasks":[126],"speaker":[128],"subtasks,":[130],"demonstrate":[131],"that":[132],"method":[135,145],"more":[137],"effective":[138],"than":[139],"several":[140],"advanced":[141],"baselines.":[142],"Furthermore,":[143],"can":[146],"be":[147],"symmetrical":[150],"stereo":[151],"speech.":[152]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
