{"id":"https://openalex.org/W4386320488","doi":"https://doi.org/10.1109/lsp.2023.3310881","title":"On Training Speech Separation Models With Various Numbers of Speakers","display_name":"On Training Speech Separation Models With Various Numbers of Speakers","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4386320488","doi":"https://doi.org/10.1109/lsp.2023.3310881"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2023.3310881","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3310881","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087125607","display_name":"Hyeon-seung Kim","orcid":"https://orcid.org/0009-0003-0366-4611"},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Hyeonseung Kim","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, South Korea","institution_ids":["https://openalex.org/I39534123"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054155133","display_name":"Jong Won Shin","orcid":"https://orcid.org/0000-0002-8910-0264"},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jong Won Shin","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, Gwangju Institute of Science and Technology, Gwangju, South Korea","institution_ids":["https://openalex.org/I39534123"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5087125607"],"corresponding_institution_ids":["https://openalex.org/I39534123"],"apc_list":null,"apc_paid":null,"fwci":0.4066,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.57100832,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"30","issue":null,"first_page":"1202","last_page":"1206"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.8028837442398071},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7117273807525635},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.6970386505126953},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.6800188422203064},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6066368222236633},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5998519062995911},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.4895933270454407},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.43655940890312195},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.411720335483551},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3359411954879761},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.335274338722229},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3264448344707489},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.21164315938949585}],"concepts":[{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.8028837442398071},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7117273807525635},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.6970386505126953},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.6800188422203064},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6066368222236633},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5998519062995911},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.4895933270454407},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.43655940890312195},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.411720335483551},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3359411954879761},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.335274338722229},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3264448344707489},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.21164315938949585},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2023.3310881","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3310881","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W80444264","https://openalex.org/W2060822897","https://openalex.org/W2124149378","https://openalex.org/W2168379380","https://openalex.org/W2221409856","https://openalex.org/W2510642588","https://openalex.org/W2567070169","https://openalex.org/W2734774145","https://openalex.org/W2735663686","https://openalex.org/W2808479354","https://openalex.org/W2891054259","https://openalex.org/W2952218014","https://openalex.org/W2962715207","https://openalex.org/W2962935966","https://openalex.org/W2963263347","https://openalex.org/W2963773971","https://openalex.org/W2964058413","https://openalex.org/W2972460025","https://openalex.org/W2972767900","https://openalex.org/W3004309045","https://openalex.org/W3013934216","https://openalex.org/W3015199127","https://openalex.org/W3015372568","https://openalex.org/W3016094953","https://openalex.org/W3016232124","https://openalex.org/W3016257794","https://openalex.org/W3032969657","https://openalex.org/W3035268204","https://openalex.org/W3042857426","https://openalex.org/W3094607766","https://openalex.org/W3094893851","https://openalex.org/W3095831308","https://openalex.org/W3099330747","https://openalex.org/W3124972797","https://openalex.org/W3160408143","https://openalex.org/W3160936850","https://openalex.org/W3161301466","https://openalex.org/W3161934504","https://openalex.org/W3163842642","https://openalex.org/W3171278394","https://openalex.org/W3210390090","https://openalex.org/W4221143485","https://openalex.org/W4295312788","https://openalex.org/W6726497184","https://openalex.org/W6731370813","https://openalex.org/W6766978945","https://openalex.org/W6774995033","https://openalex.org/W6775848399","https://openalex.org/W6809924511"],"related_works":["https://openalex.org/W2782029243","https://openalex.org/W2037487247","https://openalex.org/W3015390914","https://openalex.org/W56865080","https://openalex.org/W3000647100","https://openalex.org/W4309128996","https://openalex.org/W4210266374","https://openalex.org/W2962866211","https://openalex.org/W2891283181","https://openalex.org/W2749131051"],"abstract_inverted_index":{"Many":[0],"monaural":[1],"speech":[2,38],"separation":[3,134,164],"models":[4,135],"assume":[5],"that":[6,48,87,156],"the":[7,49,60,66,71,76,81,84,94,106,109,119,127,169],"exact":[8],"number":[9,29,51,61,67,77,139],"of":[10,30,52,62,68,78,125,140,160],"speakers":[11,53,69],"is":[12,17,54,73],"known":[13,55],"in":[14,70,80,93,122],"advance,":[15],"which":[16],"not":[18,89],"applicable":[19],"to":[20,99,117,148],"many":[21],"real-world":[22],"scenarios.":[23],"To":[24],"deal":[25],"with":[26,129,136,167],"an":[27],"unknown":[28],"speakers,":[31],"previous":[32],"approaches":[33],"either":[34],"iteratively":[35],"separate":[36],"one":[37],"at":[39],"a":[40,44,56,130,137,146],"time,":[41],"or":[42,108],"employ":[43],"more":[45],"relaxed":[46],"assumption":[47],"maximum":[50],"priori":[57],"and":[58],"set":[59],"outputs":[63,79,86,121],"accordingly.":[64],"When":[65],"mixture":[72,96],"smaller":[74],"than":[75],"latter":[82],"case,":[83],"extra":[85,120,170],"are":[88,97],"mapped":[90],"onto":[91],"signals":[92,103],"input":[95,110],"trained":[98],"produce":[100],"predefined":[101,161],"target":[102,132],"such":[104],"as":[105],"silence":[107],"mixture.":[111],"In":[112],"this":[113],"letter,":[114],"we":[115],"propose":[116],"ignore":[118],"training":[123],"instead":[124],"evaluating":[126],"cost":[128],"certain":[131],"for":[133],"fixed":[138],"output":[141,151],"channels.":[142],"We":[143],"also":[144],"introduce":[145],"method":[147],"select":[149],"valid":[150],"signals.":[152],"Experimental":[153],"results":[154],"showed":[155],"assigning":[157],"any":[158],"type":[159],"targets":[162],"degraded":[163],"performance":[165],"compared":[166],"ignoring":[168],"outputs.":[171]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
