{"id":"https://openalex.org/W3191555358","doi":"https://doi.org/10.1109/taslp.2021.3101617","title":"Monaural Speech Separation Using Speaker Embedding From Preliminary Separation","display_name":"Monaural Speech Separation Using Speaker Embedding From Preliminary Separation","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3191555358","doi":"https://doi.org/10.1109/taslp.2021.3101617","mag":"3191555358"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2021.3101617","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3101617","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034409385","display_name":"Jaeuk Byun","orcid":"https://orcid.org/0000-0002-2974-7058"},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jaeuk Byun","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, Korea","institution_ids":["https://openalex.org/I39534123"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054155133","display_name":"Jong Won Shin","orcid":"https://orcid.org/0000-0002-8910-0264"},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jong Won Shin","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, Korea","institution_ids":["https://openalex.org/I39534123"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5034409385"],"corresponding_institution_ids":["https://openalex.org/I39534123"],"apc_list":null,"apc_paid":null,"fwci":1.5236,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.83157539,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"29","issue":null,"first_page":"2753","last_page":"2763"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.7699146270751953},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6748576760292053},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6445057392120361},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6237988471984863},{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.5496767163276672},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5184511542320251},{"id":"https://openalex.org/keywords/affine-transformation","display_name":"Affine transformation","score":0.4562559723854065},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.44975394010543823},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3924775719642639},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3664781451225281},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19908103346824646},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.14254048466682434},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.10660380125045776}],"concepts":[{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.7699146270751953},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6748576760292053},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6445057392120361},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6237988471984863},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.5496767163276672},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5184511542320251},{"id":"https://openalex.org/C92757383","wikidata":"https://www.wikidata.org/wiki/Q382497","display_name":"Affine transformation","level":2,"score":0.4562559723854065},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.44975394010543823},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3924775719642639},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3664781451225281},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19908103346824646},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.14254048466682434},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.10660380125045776},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2021.3101617","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3101617","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G5023790827","display_name":null,"funder_award_id":"NRF-2019R1A2C2089324","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":84,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1522301498","https://openalex.org/W1677182931","https://openalex.org/W1836465849","https://openalex.org/W1997528538","https://openalex.org/W2077799289","https://openalex.org/W2134706965","https://openalex.org/W2194775991","https://openalex.org/W2221409856","https://openalex.org/W2344461865","https://openalex.org/W2479176461","https://openalex.org/W2609317876","https://openalex.org/W2610852352","https://openalex.org/W2669032454","https://openalex.org/W2734498959","https://openalex.org/W2734774145","https://openalex.org/W2735663686","https://openalex.org/W2760103357","https://openalex.org/W2794506738","https://openalex.org/W2808631503","https://openalex.org/W2890964092","https://openalex.org/W2947942791","https://openalex.org/W2952218014","https://openalex.org/W2958305995","https://openalex.org/W2962898354","https://openalex.org/W2962935966","https://openalex.org/W2963177459","https://openalex.org/W2963371159","https://openalex.org/W2963403868","https://openalex.org/W2963420686","https://openalex.org/W2963452667","https://openalex.org/W2963843276","https://openalex.org/W2964058413","https://openalex.org/W2964121744","https://openalex.org/W2971458685","https://openalex.org/W2971704668","https://openalex.org/W2971758476","https://openalex.org/W2972460025","https://openalex.org/W2978032182","https://openalex.org/W2981436548","https://openalex.org/W2990666817","https://openalex.org/W3008880747","https://openalex.org/W3013020904","https://openalex.org/W3015199127","https://openalex.org/W3015306128","https://openalex.org/W3015372568","https://openalex.org/W3016048045","https://openalex.org/W3016232124","https://openalex.org/W3022595508","https://openalex.org/W3035268204","https://openalex.org/W3042857426","https://openalex.org/W3049505819","https://openalex.org/W3089552252","https://openalex.org/W3094607766","https://openalex.org/W3095717210","https://openalex.org/W3096084197","https://openalex.org/W3096796823","https://openalex.org/W3097609423","https://openalex.org/W3097653961","https://openalex.org/W3097797867","https://openalex.org/W3099330747","https://openalex.org/W3108962419","https://openalex.org/W3112893973","https://openalex.org/W3124972797","https://openalex.org/W3160903688","https://openalex.org/W3162347631","https://openalex.org/W3163287738","https://openalex.org/W3163652268","https://openalex.org/W3165246035","https://openalex.org/W3196595845","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6638667902","https://openalex.org/W6739901393","https://openalex.org/W6740674931","https://openalex.org/W6751512325","https://openalex.org/W6767677336","https://openalex.org/W6774995033","https://openalex.org/W6784297428","https://openalex.org/W6784351597","https://openalex.org/W6784764134","https://openalex.org/W6786127183","https://openalex.org/W6791167661","https://openalex.org/W6795993601"],"related_works":["https://openalex.org/W2036157531","https://openalex.org/W2056406069","https://openalex.org/W1974981856","https://openalex.org/W1518859147","https://openalex.org/W2045506488","https://openalex.org/W1983045063","https://openalex.org/W2103031592","https://openalex.org/W1967226023","https://openalex.org/W2955471771","https://openalex.org/W2077498359"],"abstract_inverted_index":{"In":[0,55],"speech":[1,61],"separation,":[2],"the":[3,6,17,28,42,52,65,69,77,83,87,94,103,111,124,136,145,150],"identities":[4],"of":[5,86,98,116,130,152,160],"speakers":[7],"may":[8],"be":[9],"an":[10,32],"important":[11],"cue":[12],"to":[13,122,135],"discriminate":[14],"speeches":[15],"in":[16,68,93],"mixture":[18,53],"and":[19,114],"separate":[20],"them":[21],"better.":[22],"A":[23],"few":[24],"recent":[25],"researches":[26],"used":[27,46],"speaker":[29,44,48,66,125],"embedding":[30,49,67],"as":[31,102,127],"additional":[33,161],"information,":[34],"but":[35],"they":[36],"often":[37],"require":[38],"prior":[39],"information":[40,126],"about":[41],"target":[43],"or":[45,110,133],"noisy":[47],"extracted":[50,75],"from":[51,76],"signal.":[54],"this":[56],"article,":[57],"we":[58],"propose":[59],"monaural":[60],"separation":[62,107,154],"that":[63,144],"utilizes":[64],"later":[70,91],"separator":[71,88,95],"blocks,":[72],"which":[73],"is":[74],"intermediate":[78],"separated":[79],"results":[80,142],"obtained":[81],"by":[82],"early":[84],"stages":[85],"network.":[89],"The":[90,140],"blocks":[92,100],"networks":[96],"consisting":[97],"repeated":[99],"such":[101],"fully-convolutional":[104],"time-domain":[105],"audio":[106],"network":[108],"(Conv-TasNet)":[109],"successive":[112],"downsampling":[113],"resampling":[115],"multi-resolution":[117],"features":[118],"(SuDoRM-RF)":[119],"are":[120],"modified":[121],"take":[123],"a":[128,157],"form":[129],"affine":[131],"transformation":[132],"addition":[134],"original":[137],"input":[138],"tensor.":[139],"experimental":[141],"showed":[143],"proposed":[146],"methods":[147],"significantly":[148],"improved":[149],"performances":[151],"existing":[153],"systems":[155],"with":[156],"moderate":[158],"number":[159],"parameters.":[162]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
