{"id":"https://openalex.org/W4402474782","doi":"https://doi.org/10.1109/taslp.2024.3459430","title":"Deep Kronecker Product Beamforming for Large-Scale Microphone Arrays","display_name":"Deep Kronecker Product Beamforming for Large-Scale Microphone Arrays","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402474782","doi":"https://doi.org/10.1109/taslp.2024.3459430"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2024.3459430","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3459430","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104319380","display_name":"Weixin Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weixin Meng","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100449152","display_name":"Xiaoyu Li","orcid":"https://orcid.org/0000-0002-3222-0513"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyu Li","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053757616","display_name":"Andong Li","orcid":"https://orcid.org/0000-0003-4094-8448"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Andong Li","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090663707","display_name":"Xiaoxue Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoxue Luo","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034998288","display_name":"Shefeng Yan","orcid":"https://orcid.org/0000-0003-3343-9434"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shefeng Yan","raw_affiliation_strings":["Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100711527","display_name":"Xiaodong Li","orcid":"https://orcid.org/0000-0002-4170-0076"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Li","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070266277","display_name":"Chengshi Zheng","orcid":"https://orcid.org/0000-0001-5656-994X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengshi Zheng","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5104319380"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210099069"],"apc_list":null,"apc_paid":null,"fwci":2.453,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.90116187,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"32","issue":null,"first_page":"4537","last_page":"4553"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9083999991416931,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9017000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.6568033695220947},{"id":"https://openalex.org/keywords/kronecker-product","display_name":"Kronecker product","score":0.6512521505355835},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.6018840074539185},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.5933446884155273},{"id":"https://openalex.org/keywords/product","display_name":"Product (mathematics)","score":0.4701024889945984},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.43670088052749634},{"id":"https://openalex.org/keywords/kronecker-delta","display_name":"Kronecker delta","score":0.3626987040042877},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.33456122875213623},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2784385681152344},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.187884122133255},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.13026100397109985},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.12041980028152466},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.11915504932403564},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.08493191003799438}],"concepts":[{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.6568033695220947},{"id":"https://openalex.org/C46030957","wikidata":"https://www.wikidata.org/wiki/Q1238125","display_name":"Kronecker product","level":3,"score":0.6512521505355835},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.6018840074539185},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.5933446884155273},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.4701024889945984},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43670088052749634},{"id":"https://openalex.org/C39482219","wikidata":"https://www.wikidata.org/wiki/Q192826","display_name":"Kronecker delta","level":2,"score":0.3626987040042877},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.33456122875213623},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2784385681152344},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.187884122133255},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.13026100397109985},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.12041980028152466},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.11915504932403564},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.08493191003799438},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2024.3459430","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3459430","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W1594344483","https://openalex.org/W1974387177","https://openalex.org/W2024490156","https://openalex.org/W2037117129","https://openalex.org/W2066218102","https://openalex.org/W2093225945","https://openalex.org/W2093983253","https://openalex.org/W2100375013","https://openalex.org/W2117678320","https://openalex.org/W2119528437","https://openalex.org/W2140435203","https://openalex.org/W2143946906","https://openalex.org/W2144027068","https://openalex.org/W2150278512","https://openalex.org/W2150678643","https://openalex.org/W2273819057","https://openalex.org/W2289480995","https://openalex.org/W2398972335","https://openalex.org/W2400339399","https://openalex.org/W2507598686","https://openalex.org/W2516001803","https://openalex.org/W2517616541","https://openalex.org/W2617566018","https://openalex.org/W2640112133","https://openalex.org/W2762264186","https://openalex.org/W2899943749","https://openalex.org/W2914883047","https://openalex.org/W2921875322","https://openalex.org/W2944368176","https://openalex.org/W2952218014","https://openalex.org/W2991361823","https://openalex.org/W3015372568","https://openalex.org/W3017942586","https://openalex.org/W3025800305","https://openalex.org/W3032514799","https://openalex.org/W3087954328","https://openalex.org/W3106603336","https://openalex.org/W3120336970","https://openalex.org/W3136499730","https://openalex.org/W3137714272","https://openalex.org/W3144062511","https://openalex.org/W3153985003","https://openalex.org/W3162341667","https://openalex.org/W3192281612","https://openalex.org/W3197042120","https://openalex.org/W3210597831","https://openalex.org/W4205955626","https://openalex.org/W4210402803","https://openalex.org/W4221164004","https://openalex.org/W4225302959","https://openalex.org/W4245049843","https://openalex.org/W4247128071","https://openalex.org/W4295832084","https://openalex.org/W4307721316","https://openalex.org/W4312219134","https://openalex.org/W4312806213","https://openalex.org/W4313443698","https://openalex.org/W4372337752","https://openalex.org/W4372347386","https://openalex.org/W4382366223","https://openalex.org/W4385692894","https://openalex.org/W4385822364","https://openalex.org/W4385989146","https://openalex.org/W4388620484","https://openalex.org/W4391024977","https://openalex.org/W4392903873","https://openalex.org/W4402316486","https://openalex.org/W6631190155","https://openalex.org/W6791006086"],"related_works":["https://openalex.org/W123417539","https://openalex.org/W4233239985","https://openalex.org/W2079407403","https://openalex.org/W2060299328","https://openalex.org/W2117336295","https://openalex.org/W2073634779","https://openalex.org/W3102722572","https://openalex.org/W2090103374","https://openalex.org/W1564288589","https://openalex.org/W577870507"],"abstract_inverted_index":{"Although":[0],"deep":[1,92,146],"learning":[2],"based":[3],"beamformers":[4,52,93],"have":[5],"achieved":[6],"promising":[7],"performance":[8,16,50,90,134,239],"using":[9,213],"small":[10,142],"microphone":[11,39,116,129,143],"arrays,":[12],"they":[13],"suffer":[14],"from":[15],"degradation":[17],"in":[18,53,67,78,97,157,200,224,254,261],"very":[19,98,262],"challenging":[20,55,99],"environments,":[21,29],"such":[22],"as":[23],"extremely":[24],"low":[25,263],"Signal-to-Noise":[26],"Ratio":[27],"(SNR)":[28],"e.g.,":[30],"SNR":[31,264],"<inline-formula":[32],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[33],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[34],"notation=\"LaTeX\">$\\le$</tex-math></inline-formula>\u221210":[35],"dB.":[36],"A":[37],"large-scale":[38,115,210],"array":[40,130],"with":[41,140],"dozens":[42],"or":[43],"hundreds":[44],"of":[45,51,58,70,91,135,187,240,256],"microphones":[46,71],"can":[47,131],"improve":[48,88],"the":[49,68,89,120,158,163,171,177,184,214,221,238,247],"these":[54],"scenarios":[56],"because":[57],"its":[59],"high":[60],"spatial":[61,136],"resolution.":[62],"While":[63],"a":[64,104,127,141,225],"dramatic":[65],"increase":[66],"number":[69],"leads":[72],"to":[73,87,175,198,234],"feature":[74,79,164],"redundancy,":[75],"causing":[76],"difficulties":[77],"extraction":[80,96,160],"and":[81,145,217,220,228,236],"network":[82],"training.":[83],"As":[84],"an":[85,201],"attempt":[86],"for":[94,114,151],"speech":[95,159],"scenarios,":[100],"this":[101],"paper":[102],"proposes":[103],"novel":[105],"all":[106],"neural":[107,147],"Kronecker":[108,172,185],"product":[109,173,186],"beamforming":[110],"denoted":[111],"by":[112,118,169],"ANKP-BF":[113,195],"arrays":[117],"taking":[119],"following":[121],"two":[122,188],"aspects":[123],"into":[124,183],"account.":[125],"Firstly,":[126],"larger":[128],"provide":[132],"higher":[133],"filtering":[137],"when":[138],"compared":[139],"array,":[144],"networks":[148],"are":[149,206,231],"introduced":[150],"their":[152],"powerful":[153],"non-linear":[154],"modeling":[155],"capability":[156],"task.":[161],"Secondly,":[162],"redundancy":[165],"problem":[166],"is":[167,196],"solved":[168],"introducing":[170],"rule":[174],"decompose":[176],"original":[178],"one":[179],"high-dimension":[180],"weight":[181,191],"vector":[182],"much":[189],"lower-dimensional":[190],"vectors.":[192],"The":[193],"proposed":[194,248],"designed":[197],"operate":[199],"end-to-end":[202],"manner.":[203],"Extensive":[204],"experiments":[205],"conducted":[207],"on":[208],"simulated":[209],"microphone-array":[211],"signals":[212],"DNS-Challenge":[215],"corpus":[216],"WSJ0-SI84":[218],"corpus,":[219],"real":[222],"recordings":[223],"semi-anechoic":[226],"room":[227],"outdoor":[229],"scenes":[230],"also":[232],"used":[233],"evaluate":[235],"compare":[237],"different":[241],"methods.":[242],"Quantitative":[243],"results":[244],"demonstrate":[245],"that":[246],"method":[249],"outperforms":[250],"existing":[251],"advanced":[252],"baselines":[253],"terms":[255],"multiple":[257],"objective":[258],"metrics,":[259],"especially":[260],"environments.":[265]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
