{"id":"https://openalex.org/W3097653961","doi":"https://doi.org/10.21437/interspeech.2020-1397","title":"SpEx+: A Complete Time Domain Speaker Extraction Network","display_name":"SpEx+: A Complete Time Domain Speaker Extraction Network","publication_year":2020,"publication_date":"2020-10-25","ids":{"openalex":"https://openalex.org/W3097653961","doi":"https://doi.org/10.21437/interspeech.2020-1397","mag":"3097653961"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2020-1397","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-1397","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2020","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071074013","display_name":"Meng Ge","orcid":"https://orcid.org/0000-0003-2017-4529"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]},{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["CN","SG"],"is_corresponding":true,"raw_author_name":"Meng Ge","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103210439","display_name":"Chenglin Xu","orcid":"https://orcid.org/0000-0002-1584-6282"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]},{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Chenglin Xu","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore","Department of Electrical and Computer Engineering, National University of Singapore, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101745213","display_name":"Longbiao Wang","orcid":"https://orcid.org/0000-0002-8094-6861"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longbiao Wang","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070872826","display_name":"Eng Siong Chng","orcid":"https://orcid.org/0000-0001-6257-7399"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Eng Siong Chng","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017251198","display_name":"Jianwu Dang","orcid":"https://orcid.org/0000-0002-9237-4821"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]},{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN","JP"],"is_corresponding":false,"raw_author_name":"Jianwu Dang","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","Japan Advanced Institute of Science and Technology, Ishikawa, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"Japan Advanced Institute of Science and Technology, Ishikawa, Japan","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":"https://orcid.org/0000-0001-9158-9401"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]},{"id":"https://openalex.org/I180437899","display_name":"University of Bremen","ror":"https://ror.org/04ers2y35","country_code":"DE","type":"education","lineage":["https://openalex.org/I180437899"]}],"countries":["DE","SG"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore, Singapore","Machine Listening Lab, University of Bremen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Machine Listening Lab, University of Bremen, Germany","institution_ids":["https://openalex.org/I180437899"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5071074013"],"corresponding_institution_ids":["https://openalex.org/I162868743","https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":9.5195,"has_fulltext":false,"cited_by_count":144,"citation_normalized_percentile":{"value":0.98429938,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1406","last_page":"1410"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6568083763122559},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.6483215093612671},{"id":"https://openalex.org/keywords/time-domain","display_name":"Time domain","score":0.5100651383399963},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5022127628326416},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.45838943123817444},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15514710545539856},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.10618570446968079},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.0990632176399231}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6568083763122559},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.6483215093612671},{"id":"https://openalex.org/C103824480","wikidata":"https://www.wikidata.org/wiki/Q185889","display_name":"Time domain","level":2,"score":0.5100651383399963},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5022127628326416},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.45838943123817444},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15514710545539856},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.10618570446968079},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0990632176399231},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2020-1397","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-1397","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2020","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","display_name":"Gender equality","score":0.699999988079071}],"awards":[{"id":"https://openalex.org/G2425286661","display_name":null,"funder_award_id":"EXC 2077","funder_id":"https://openalex.org/F4320324729","funder_display_name":"Universit\u00e4t Bremen"},{"id":"https://openalex.org/G4464239203","display_name":null,"funder_award_id":"EXC 2077","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320324729","display_name":"Universit\u00e4t Bremen","ror":"https://ror.org/04ers2y35"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W2221409856","https://openalex.org/W2460742184","https://openalex.org/W2529093176","https://openalex.org/W2558649592","https://openalex.org/W2734774145","https://openalex.org/W2735663686","https://openalex.org/W2749510669","https://openalex.org/W2787692317","https://openalex.org/W2800022361","https://openalex.org/W2800664709","https://openalex.org/W2889029567","https://openalex.org/W2889540509","https://openalex.org/W2891405874","https://openalex.org/W2891833136","https://openalex.org/W2895807593","https://openalex.org/W2924115626","https://openalex.org/W2939771864","https://openalex.org/W2951130829","https://openalex.org/W2952218014","https://openalex.org/W2962715207","https://openalex.org/W2962905190","https://openalex.org/W2973054998","https://openalex.org/W2973062255","https://openalex.org/W3008400075","https://openalex.org/W3015199127","https://openalex.org/W3015636705","https://openalex.org/W3103434036","https://openalex.org/W3105928222"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2530322880","https://openalex.org/W1596801655","https://openalex.org/W2359140296"],"abstract_inverted_index":{"Speaker":[0],"extraction":[1,91],"aims":[2],"to":[3],"extract":[4],"the":[5,27,55,59,65,79,99,109,116,121,130],"target":[6,15],"speech":[7,44,104],"signal":[8],"from":[9],"a":[10,14,21,37,87],"multi-talker":[11],"environment":[12],"given":[13],"speaker's":[16],"reference":[17],"speech.We":[18],"recently":[19],"proposed":[20],"time-domain":[22,38,43,89],"solution,":[23,92],"SpEx,":[24],"that":[25,93,120],"avoids":[26],"phase":[28],"estimation":[29],"in":[30],"frequency-domain":[31,51,68],"approaches.Unfortunately,":[32],"SpEx":[33,132],"is":[34,94],"not":[35],"fully":[36],"solution":[39],"since":[40],"it":[41],"performs":[42],"encoding":[45],"for":[46,62,67,108],"speaker":[47,52,90,117],"extraction,":[48],"while":[49],"taking":[50],"embedding":[53],"as":[54,113],"reference.The":[56],"size":[57,66],"of":[58,101,115],"analysis":[60],"window":[61],"timedomain":[63],"and":[64,125,136],"input":[69],"are":[70],"also":[71],"different.Such":[72],"mismatch":[73],"has":[74],"an":[75],"adverse":[76],"effect":[77],"on":[78,140],"system":[80],"performance.To":[81],"eliminate":[82],"such":[83],"mismatch,":[84],"we":[85,97],"propose":[86],"complete":[88],"called":[95],"SpEx+.Specifically,":[96],"tie":[98],"weights":[100],"two":[102],"identical":[103],"encoder":[105],"networks,":[106],"one":[107],"encoder-extractor-decoder":[110],"pipeline,":[111],"another":[112],"part":[114],"encoder.Experiments":[118],"show":[119],"SpEx+":[122],"achieves":[123],"0.8dB":[124],"2.1dB":[126],"SDR":[127],"improvement":[128],"over":[129],"state-of-the-art":[131],"baseline,":[133],"under":[134],"different":[135],"same":[137],"gender":[138],"conditions":[139],"WSJ0-2mix-extr":[141],"database":[142],"respectively.":[143]},"counts_by_year":[{"year":2026,"cited_by_count":10},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":37},{"year":2023,"cited_by_count":27},{"year":2022,"cited_by_count":22},{"year":2021,"cited_by_count":17},{"year":2020,"cited_by_count":4}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
