{"id":"https://openalex.org/W3200531652","doi":"https://doi.org/10.1109/asru51503.2021.9688126","title":"Conferencingspeech Challenge: Towards Far-Field Multi-Channel Speech Enhancement for Video Conferencing","display_name":"Conferencingspeech Challenge: Towards Far-Field Multi-Channel Speech Enhancement for Video Conferencing","publication_year":2021,"publication_date":"2021-12-13","ids":{"openalex":"https://openalex.org/W3200531652","doi":"https://doi.org/10.1109/asru51503.2021.9688126","mag":"3200531652"},"language":"en","primary_location":{"id":"doi:10.1109/asru51503.2021.9688126","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru51503.2021.9688126","pdf_url":null,"source":{"id":"https://openalex.org/S4363606113","display_name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016229505","display_name":"Wei Rao","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Rao","raw_affiliation_strings":["Tencent Ethereal Audio Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Ethereal Audio Lab,China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010250251","display_name":"Yihui Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yihui Fu","raw_affiliation_strings":["Northwestern Polytechnical University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern Polytechnical University,China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101330960","display_name":"Yanxin Hu","orcid":"https://orcid.org/0009-0009-4388-8883"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanxin Hu","raw_affiliation_strings":["Northwestern Polytechnical University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern Polytechnical University,China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038452997","display_name":"Xin Xu","orcid":"https://orcid.org/0000-0003-4625-5482"},"institutions":[{"id":"https://openalex.org/I7923278","display_name":"Shell (Netherlands)","ror":"https://ror.org/00b5m4j81","country_code":"NL","type":"company","lineage":["https://openalex.org/I7923278"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Xin Xu","raw_affiliation_strings":["Beijing Shell Shell Technology Co., LTD.,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Shell Shell Technology Co., LTD.,China","institution_ids":["https://openalex.org/I7923278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025176787","display_name":"Yvkai Jv","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yvkai Jv","raw_affiliation_strings":["Northwestern Polytechnical University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern Polytechnical University,China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090367911","display_name":"Jiangyu Han","orcid":"https://orcid.org/0000-0001-5390-8520"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiangyu Han","raw_affiliation_strings":["Tencent Ethereal Audio Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Ethereal Audio Lab,China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101421603","display_name":"Zhongjie Jiang","orcid":"https://orcid.org/0009-0009-7256-6592"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongjie Jiang","raw_affiliation_strings":["Tencent Ethereal Audio Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Ethereal Audio Lab,China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066245750","display_name":"Lei Xie","orcid":"https://orcid.org/0000-0001-9051-2111"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Xie","raw_affiliation_strings":["Northwestern Polytechnical University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern Polytechnical University,China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084128157","display_name":"Yannan Wang","orcid":"https://orcid.org/0000-0001-7248-4954"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yannan Wang","raw_affiliation_strings":["Tencent Ethereal Audio Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Ethereal Audio Lab,China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001291873","display_name":"Shinji Watanabe","orcid":"https://orcid.org/0000-0002-5970-8631"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["Carnegie Mellon University,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090108098","display_name":"Zheng\u2010Hua Tan","orcid":"https://orcid.org/0000-0001-6856-8928"},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Zheng-Hua Tan","raw_affiliation_strings":["Aalborg University,Denmark","Institut for Elektroniske Systemer"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]},{"raw_affiliation_string":"Institut for Elektroniske Systemer","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101791717","display_name":"Hui Bu","orcid":"https://orcid.org/0000-0003-1883-8496"},"institutions":[{"id":"https://openalex.org/I7923278","display_name":"Shell (Netherlands)","ror":"https://ror.org/00b5m4j81","country_code":"NL","type":"company","lineage":["https://openalex.org/I7923278"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Hui Bu","raw_affiliation_strings":["Beijing Shell Shell Technology Co., LTD.,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Shell Shell Technology Co., LTD.,China","institution_ids":["https://openalex.org/I7923278"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057697869","display_name":"Tao Yu","orcid":"https://orcid.org/0000-0002-0143-261X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao Yu","raw_affiliation_strings":["Tencent Ethereal Audio Lab,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Ethereal Audio Lab,USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078353046","display_name":"Shidong Shang","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shidong Shang","raw_affiliation_strings":["Tencent Ethereal Audio Lab,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Ethereal Audio Lab,China","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":14,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5163,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.64285714,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"679","last_page":"686"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13905","display_name":"Telecommunications and Broadcasting Technologies","score":0.9107000231742859,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/videoconferencing","display_name":"Videoconferencing","score":0.5253964066505432},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4977283775806427},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.454274982213974},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.43332940340042114},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.3675382733345032},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0819101631641388}],"concepts":[{"id":"https://openalex.org/C22561748","wikidata":"https://www.wikidata.org/wiki/Q854954","display_name":"Videoconferencing","level":2,"score":0.5253964066505432},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4977283775806427},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.454274982213974},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.43332940340042114},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.3675382733345032},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0819101631641388},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/asru51503.2021.9688126","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru51503.2021.9688126","pdf_url":null,"source":{"id":"https://openalex.org/S4363606113","display_name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:publications/e3d2e75c-f42b-4149-9b1a-20e9b61fe583","is_oa":false,"landing_page_url":"https://vbn.aau.dk/da/publications/e3d2e75c-f42b-4149-9b1a-20e9b61fe583","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Rao , W , Fu , Y , Hu , Y , Xu , X , Jv , Y , Han , J , Jiang , Z , Xie , L , Wang , Y , Watanabe , S , Tan , Z-H , Bu , H , Yu , T &amp; Shang , S 2021 , ConferencingSpeech Challenge : Towards Far-field Multi-Channel Speech Enhancement for Video Conferencing . in IEEE Automatic Speech Recognition and Understanding Workshop . , 9688126 , IEEE , IEEE Automatic Speech Recognition and Understanding Workshop , 13/12/2021 . https://doi.org/10.1109/ASRU51503.2021.9688126","raw_type":"contributionToPeriodical"},{"id":"mag:3200531652","is_oa":false,"landing_page_url":"https://vbn.aau.dk/en/publications/conferencingspeech-challenge-towards-far-field-multi-channel-spee","pdf_url":null,"source":{"id":"https://openalex.org/S4306418586","display_name":"IEEE Automatic Speech Recognition and Understanding Workshop","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Automatic Speech Recognition and Understanding Workshop","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1591607137","https://openalex.org/W1897240248","https://openalex.org/W2000221426","https://openalex.org/W2095072097","https://openalex.org/W2291877678","https://openalex.org/W2550397165","https://openalex.org/W2568308529","https://openalex.org/W2746457594","https://openalex.org/W2749335474","https://openalex.org/W2755891984","https://openalex.org/W2774425939","https://openalex.org/W2884797218","https://openalex.org/W2935934262","https://openalex.org/W2963040451","https://openalex.org/W2963242190","https://openalex.org/W3016232124","https://openalex.org/W3020336359","https://openalex.org/W3096408984","https://openalex.org/W3097224504","https://openalex.org/W3097263872","https://openalex.org/W3097906045","https://openalex.org/W3196343857","https://openalex.org/W3198027828","https://openalex.org/W3198511309","https://openalex.org/W4253928870","https://openalex.org/W6678809451","https://openalex.org/W6688816777","https://openalex.org/W6782481672","https://openalex.org/W6782486312"],"related_works":["https://openalex.org/W2359085723","https://openalex.org/W2365848060","https://openalex.org/W2834559563","https://openalex.org/W165648171","https://openalex.org/W2355142598","https://openalex.org/W2022846483","https://openalex.org/W2379194429","https://openalex.org/W1512065203","https://openalex.org/W1975548320","https://openalex.org/W2839185386","https://openalex.org/W13453321","https://openalex.org/W2043171225","https://openalex.org/W2059114595","https://openalex.org/W1492164297","https://openalex.org/W3127654951","https://openalex.org/W2042045798","https://openalex.org/W2004047800","https://openalex.org/W1581404964","https://openalex.org/W1962875467","https://openalex.org/W2378748680"],"abstract_inverted_index":{"The":[0,17,136,182],"ConferencingSpeech":[1],"2021":[2],"challenge":[3,18,87,141,180],"is":[4,27,47,57,150,186],"proposed":[5],"to":[6,74,131,157],"stimulate":[7],"research":[8],"on":[9,37],"far-field":[10],"multi-channel":[11,28,48],"speech":[12,29,49,77,119,163],"enhancement":[13,30,50],"for":[14,129],"video":[15,82],"conferencing.":[16],"consists":[19],"of":[20,105,115,139],"two":[21],"separate":[22],"tasks:":[23],"1)":[24],"Task":[25,45],"1":[26],"with":[31,40,51],"single":[32],"microphone":[33],"array":[34],"and":[35,43,61,94,120,125,166,179,194],"focusing":[36],"practical":[38],"application":[39],"real-time":[41],"requirement":[42],"2)":[44],"2":[46],"multiple":[52],"distributed":[53],"micro-phone":[54],"arrays,":[55],"which":[56,149,185],"a":[58,126,187],"non-real-time":[59],"track":[60],"does":[62],"not":[63],"have":[64],"any":[65,72],"constraints":[66],"so":[67],"that":[68],"participants":[69,130],"could":[70],"explore":[71],"algorithms":[73],"obtain":[75],"high":[76],"quality.":[78],"Targeting":[79],"the":[80,86,102,113,140,146,173],"real":[81,92,103],"conferencing":[83,106],"room":[84],"application,":[85],"database":[88],"was":[89],"recorded":[90],"from":[91],"speakers":[93],"all":[95],"recording":[96],"facilities":[97],"were":[98],"located":[99],"by":[100,145],"following":[101],"setup":[104],"room.":[107],"In":[108],"this":[109],"challenge,":[110,174],"we":[111],"open-sourced":[112],"list":[114],"open":[116],"source":[117],"clean":[118],"noise":[121,167],"datasets,":[122,176],"simulation":[123],"scripts,":[124],"baseline":[127,183],"system":[128,184],"develop":[132],"their":[133],"own":[134],"system.":[135],"final":[137],"ranking":[138],"will":[142],"be":[143],"decided":[144],"subjective":[147,177],"evaluation":[148],"performed":[151],"using":[152],"Absolute":[153],"Category":[154],"Ratings":[155],"(ACR)":[156],"estimate":[158],"Mean":[159],"Opinion":[160],"Score":[161],"(MOS),":[162],"MOS":[164,168],"(S-MOS),":[165],"(N-MOS).":[169],"This":[170],"paper":[171],"describes":[172],"tasks,":[175],"evaluation,":[178],"results.":[181],"complex":[188],"ratio":[189],"mask":[190],"based":[191],"neural":[192],"network":[193],"its":[195],"experimental":[196],"results":[197],"are":[198],"also":[199],"presented.":[200]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
