{"id":"https://openalex.org/W4403134597","doi":"https://doi.org/10.3390/info15100608","title":"Threshold-Based Combination of Ideal Binary Mask and Ideal Ratio Mask for Single-Channel Speech Separation","display_name":"Threshold-Based Combination of Ideal Binary Mask and Ideal Ratio Mask for Single-Channel Speech Separation","publication_year":2024,"publication_date":"2024-10-04","ids":{"openalex":"https://openalex.org/W4403134597","doi":"https://doi.org/10.3390/info15100608"},"language":"en","primary_location":{"id":"doi:10.3390/info15100608","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info15100608","pdf_url":"https://www.mdpi.com/2078-2489/15/10/608/pdf?version=1728039651","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2078-2489/15/10/608/pdf?version=1728039651","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100338432","display_name":"Peng Chen","orcid":"https://orcid.org/0000-0001-7522-3813"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Peng Chen","raw_affiliation_strings":["Graduate School of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068261641","display_name":"Binh Thien Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Binh Thien Nguyen","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075933324","display_name":"Kenta Iwai","orcid":"https://orcid.org/0000-0002-9738-8579"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kenta Iwai","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009257831","display_name":"Takanobu Nishiura","orcid":"https://orcid.org/0000-0002-1706-4743"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Takanobu Nishiura","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University, Ibaraki 567-8570, Osaka, Japan","institution_ids":["https://openalex.org/I135768898"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5009257831","https://openalex.org/A5100338432"],"corresponding_institution_ids":["https://openalex.org/I135768898"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":1.0979,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.77776016,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"15","issue":"10","first_page":"608","last_page":"608"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ideal","display_name":"Ideal (ethics)","score":0.8364454507827759},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.6785237789154053},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.5796903967857361},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.5679972171783447},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3328055143356323},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.33016064763069153},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.3221539258956909},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.28822678327560425},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.18372175097465515},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.1176881194114685},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.09714463353157043},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.06203567981719971}],"concepts":[{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.8364454507827759},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.6785237789154053},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.5796903967857361},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.5679972171783447},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3328055143356323},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.33016064763069153},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.3221539258956909},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.28822678327560425},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.18372175097465515},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.1176881194114685},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.09714463353157043},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.06203567981719971},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/info15100608","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info15100608","pdf_url":"https://www.mdpi.com/2078-2489/15/10/608/pdf?version=1728039651","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:d669799ce8d34b1badb77dffb22ac884","is_oa":true,"landing_page_url":"https://doaj.org/article/d669799ce8d34b1badb77dffb22ac884","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Information, Vol 15, Iss 10, p 608 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/info15100608","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info15100608","pdf_url":"https://www.mdpi.com/2078-2489/15/10/608/pdf?version=1728039651","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403134597.pdf"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W160800111","https://openalex.org/W190004713","https://openalex.org/W285277413","https://openalex.org/W1897240248","https://openalex.org/W1936725236","https://openalex.org/W1979099822","https://openalex.org/W2027701650","https://openalex.org/W2031647436","https://openalex.org/W2041823554","https://openalex.org/W2044222806","https://openalex.org/W2053165762","https://openalex.org/W2058676219","https://openalex.org/W2060822897","https://openalex.org/W2069681747","https://openalex.org/W2078528584","https://openalex.org/W2087126002","https://openalex.org/W2097242476","https://openalex.org/W2127851351","https://openalex.org/W2128653836","https://openalex.org/W2129244720","https://openalex.org/W2141113219","https://openalex.org/W2141411743","https://openalex.org/W2161863519","https://openalex.org/W2167090878","https://openalex.org/W2345067732","https://openalex.org/W2408744528","https://openalex.org/W2598036111","https://openalex.org/W2678916739","https://openalex.org/W2790760353","https://openalex.org/W2794289187","https://openalex.org/W2890111732","https://openalex.org/W2895188252","https://openalex.org/W2962866211","https://openalex.org/W2998155746","https://openalex.org/W3100732527","https://openalex.org/W4245919820","https://openalex.org/W4256161595","https://openalex.org/W4321600175"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2935759653","https://openalex.org/W3105167352","https://openalex.org/W54078636","https://openalex.org/W2954470139","https://openalex.org/W1501425562","https://openalex.org/W2902782467","https://openalex.org/W3084825885","https://openalex.org/W2004554462","https://openalex.org/W2791440692"],"abstract_inverted_index":{"An":[0],"effective":[1],"approach":[2],"to":[3,30,67,81,120],"addressing":[4],"the":[5,35,44,89,111,122,125,145,155,171,175,178,185,198],"speech":[6,32,41,50,85,97,131,188],"separation":[7,98,132,189],"problem":[8],"is":[9,37,46],"utilizing":[10],"a":[11,105,117,135],"time\u2013frequency":[12],"(T-F)":[13],"mask.":[14],"The":[15],"ideal":[16,21,63,101],"binary":[17],"mask":[18,23,65,173],"(IBM)":[19],"and":[20,57,103,140,162,180,182],"ratio":[22,157,160,164],"(IRM)":[24],"have":[25],"long":[26,141],"been":[27],"widely":[28],"used":[29],"separate":[31],"signals.":[33],"However,":[34],"IBM":[36,179],"better":[38,47],"at":[39,48],"improving":[40,49],"intelligibility,":[42],"while":[43],"IRM":[45,181],"quality.":[51],"To":[52],"leverage":[53],"their":[54],"respective":[55],"strengths":[56,176],"overcome":[58],"weaknesses,":[59],"we":[60,128],"propose":[61],"an":[62],"threshold-based":[64],"(ITM)":[66],"combine":[68],"these":[69,76],"two":[70,74,77],"masks.":[71,202],"By":[72,113],"adjusting":[73],"thresholds,":[75],"masks":[78,115],"are":[79],"combined":[80],"jointly":[82],"act":[83],"on":[84,96],"separation.":[86],"We":[87],"list":[88],"impact":[90],"of":[91,124,147,177,187,200],"using":[92,114],"different":[93,201],"threshold":[94],"combinations":[95],"performance":[99],"under":[100],"conditions":[102],"discuss":[104],"reasonable":[106],"range":[107],"for":[108],"fine":[109],"tuning":[110],"thresholds.":[112],"as":[116],"training":[118],"target,":[119],"evaluate":[121],"effectiveness":[123],"proposed":[126,172],"method,":[127],"conducted":[129],"supervised":[130],"experiments":[133],"applying":[134],"deep":[136],"neural":[137],"network":[138],"(DNN)":[139],"short-term":[142],"memory":[143],"(LSTM),":[144],"results":[146,168],"which":[148],"were":[149],"measured":[150],"by":[151,195],"three":[152],"objective":[153],"indicators:":[154],"signal-to-distortion":[156],"(SDR),":[158],"signal-to-interference":[159],"(SIR),":[161],"signal-to-artifact":[163],"improvement":[165],"(SAR).":[166],"Experimental":[167],"show":[169],"that":[170,184],"combines":[174],"implies":[183],"accuracy":[186],"can":[190],"potentially":[191],"be":[192],"further":[193],"improved":[194],"effectively":[196],"leveraging":[197],"advantages":[199]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
