{"id":"https://openalex.org/W4392903873","doi":"https://doi.org/10.1109/icassp48485.2024.10447292","title":"All Neural Kronecker Product Beamforming for Speech Extraction with Large-Scale Microphone Arrays","display_name":"All Neural Kronecker Product Beamforming for Speech Extraction with Large-Scale Microphone Arrays","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392903873","doi":"https://doi.org/10.1109/icassp48485.2024.10447292"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10447292","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447292","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104319380","display_name":"Weixin Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weixin Meng","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100449152","display_name":"Xiaoyu Li","orcid":"https://orcid.org/0000-0002-3222-0513"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyu Li","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053757616","display_name":"Andong Li","orcid":"https://orcid.org/0000-0003-4094-8448"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Andong Li","raw_affiliation_strings":["Tencent AI Lab,Beijing,China","Tencent AI Lab, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab,Beijing,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent AI Lab, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100402534","display_name":"Jian Li","orcid":"https://orcid.org/0000-0002-7521-8798"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Li","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","University of Chinese Academy of Sciences, Beijing, China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100711527","display_name":"Xiaodong Li","orcid":"https://orcid.org/0000-0002-4170-0076"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Li","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070266277","display_name":"Chengshi Zheng","orcid":"https://orcid.org/0000-0001-5656-994X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengshi Zheng","raw_affiliation_strings":["Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Key Laboratory of Noise and Vibration Research, Institute of Acoustics,Beijing,China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5104319380"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210099069","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.3604,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.48876672,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"106","issue":null,"first_page":"8566","last_page":"8570"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7592953443527222},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.6424559354782104},{"id":"https://openalex.org/keywords/microphone-array","display_name":"Microphone array","score":0.5832717418670654},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5407137870788574},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5215280055999756},{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.5108625292778015},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.5046623945236206},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.47222259640693665},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.46161115169525146},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43085604906082153},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3702036142349243},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36241501569747925}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7592953443527222},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.6424559354782104},{"id":"https://openalex.org/C2778806681","wikidata":"https://www.wikidata.org/wiki/Q907293","display_name":"Microphone array","level":4,"score":0.5832717418670654},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5407137870788574},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5215280055999756},{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.5108625292778015},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.5046623945236206},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.47222259640693665},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.46161115169525146},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43085604906082153},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3702036142349243},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36241501569747925},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10447292","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447292","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5249178904","display_name":null,"funder_award_id":"Grant No. 6","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7943112371","display_name":null,"funder_award_id":"62001467","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1552314771","https://openalex.org/W2066218102","https://openalex.org/W2094287371","https://openalex.org/W2117678320","https://openalex.org/W2150678643","https://openalex.org/W2289480995","https://openalex.org/W2398042854","https://openalex.org/W2507598686","https://openalex.org/W2516001803","https://openalex.org/W2791568767","https://openalex.org/W2890553422","https://openalex.org/W2952218014","https://openalex.org/W2991361823","https://openalex.org/W3015599456","https://openalex.org/W3017942586","https://openalex.org/W3025800305","https://openalex.org/W3032514799","https://openalex.org/W3099330747","https://openalex.org/W3120336970","https://openalex.org/W3162341667","https://openalex.org/W3197042120","https://openalex.org/W4210402803","https://openalex.org/W4221164004","https://openalex.org/W4247128071","https://openalex.org/W4312219134","https://openalex.org/W4313443698","https://openalex.org/W4322717140","https://openalex.org/W4372337752","https://openalex.org/W4388620484","https://openalex.org/W6631190155","https://openalex.org/W6785764544","https://openalex.org/W6799760327","https://openalex.org/W6849772234"],"related_works":["https://openalex.org/W2896203542","https://openalex.org/W201299990","https://openalex.org/W876328409","https://openalex.org/W4319068615","https://openalex.org/W1879255185","https://openalex.org/W2148473678","https://openalex.org/W3004719695","https://openalex.org/W2120442551","https://openalex.org/W2769861442","https://openalex.org/W1980506188"],"abstract_inverted_index":{"Existing":[0],"frame-wise":[1],"neural":[2,84],"beamformers":[3,125],"for":[4,58,126],"speech":[5,88],"extraction":[6,89],"can":[7],"obtain":[8],"promising":[9],"performance":[10,27,90],"in":[11,29,91,143,170],"relatively":[12,30],"high":[13,69],"signal-to-noise":[14],"ratio":[15],"(SNR)":[16],"scenarios":[17],"using":[18,155],"small":[19,121],"microphone":[20,60,74],"arrays,":[21],"while":[22],"they":[23],"still":[24],"suffer":[25],"from":[26],"degradation":[28],"low":[31],"SNR":[32],"environments,":[33],"e.g.,":[34],"SNR<-5":[35],"dB.":[36],"As":[37],"an":[38,47,144],"attempt":[39],"to":[40,66,86,97,113,141],"solve":[41],"this":[42,44,95],"problem,":[43],"paper":[45],"proposes":[46],"all-neural":[48],"beamformer":[49],"based":[50],"on":[51,150],"Kronecker":[52,110],"product":[53,111],"decomposition,":[54],"denoted":[55],"by":[56],"NeuKP-BF,":[57],"large-scale":[59,117],"arrays.":[61],"The":[62,136,159],"core":[63],"idea":[64],"is":[65],"incorporate":[67],"the":[68,77,99,105,109,115,127,152,156,163],"spatial":[70],"resolution":[71],"of":[72,82,172],"large":[73],"arrays":[75],"and":[76,103,124,133],"powerful":[78],"non-linear":[79],"modeling":[80],"capability":[81],"deep":[83],"networks":[85],"improve":[87,104],"challenging":[92],"environments.":[93],"In":[94],"paper,":[96],"reduce":[98],"feature":[100],"representation":[101],"redundancy":[102],"interpretability,":[106],"we":[107],"used":[108],"rule":[112],"decompose":[114],"original":[116],"array":[118],"into":[119],"two":[120,128],"virtual":[122],"subarrays,":[123],"subarrays":[129],"were":[130,148],"then":[131],"designed":[132,140],"merged":[134],"finally.":[135],"whole":[137],"system":[138],"was":[139],"implement":[142],"end-to-end":[145],"manner.":[146],"Experiments":[147],"conducted":[149],"both":[151],"synthesized":[153],"data":[154],"DNS-Challenge":[157],"corpus.":[158],"results":[160],"showed":[161],"that":[162],"proposed":[164],"approach":[165],"outperformed":[166],"existing":[167],"advanced":[168],"baselines":[169],"terms":[171],"multiple":[173],"objective":[174],"metrics.":[175]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
