{"id":"https://openalex.org/W4372259805","doi":"https://doi.org/10.1109/icassp49357.2023.10095128","title":"Optimal Condition Training for Target Source Separation","display_name":"Optimal Condition Training for Target Source Separation","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372259805","doi":"https://doi.org/10.1109/icassp49357.2023.10095128"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10095128","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095128","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016864112","display_name":"Efthymios Tzinis","orcid":"https://orcid.org/0000-0002-1047-1338"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]},{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Efthymios Tzinis","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","University of Illinois Urbana-Champaign, Urbana, IL, USA","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"University of Illinois Urbana-Champaign, Urbana, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086940921","display_name":"Gordon Wichern","orcid":"https://orcid.org/0000-0002-8597-6795"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gordon Wichern","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038903729","display_name":"Paris Smaragdis","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paris Smaragdis","raw_affiliation_strings":["University of Illinois Urbana-Champaign,Urbana,IL,USA","University of Illinois Urbana-Champaign, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,Urbana,IL,USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois Urbana-Champaign, Urbana, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076453358","display_name":"Jonathan Le Roux","orcid":"https://orcid.org/0000-0002-3451-171X"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan Le Roux","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5016864112"],"corresponding_institution_ids":["https://openalex.org/I157725225","https://openalex.org/I4210159266"],"apc_list":null,"apc_paid":null,"fwci":1.2226,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.78597809,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7593991756439209},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.689224898815155},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.5847181677818298},{"id":"https://openalex.org/keywords/permutation","display_name":"Permutation (music)","score":0.5084297060966492},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.447234183549881},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44398224353790283},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.38712042570114136},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3521467447280884},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3384156823158264}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7593991756439209},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.689224898815155},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.5847181677818298},{"id":"https://openalex.org/C21308566","wikidata":"https://www.wikidata.org/wiki/Q7169365","display_name":"Permutation (music)","level":2,"score":0.5084297060966492},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.447234183549881},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44398224353790283},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.38712042570114136},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3521467447280884},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3384156823158264},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10095128","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095128","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1482149378","https://openalex.org/W1522301498","https://openalex.org/W2043095867","https://openalex.org/W2046869671","https://openalex.org/W2078528584","https://openalex.org/W2221409856","https://openalex.org/W2460742184","https://openalex.org/W2644497536","https://openalex.org/W2760103357","https://openalex.org/W2774707525","https://openalex.org/W2891833136","https://openalex.org/W2896457183","https://openalex.org/W2909607850","https://openalex.org/W2936302822","https://openalex.org/W2938646939","https://openalex.org/W2954304925","https://openalex.org/W2962715207","https://openalex.org/W2962753171","https://openalex.org/W2962866211","https://openalex.org/W2963189033","https://openalex.org/W2973062255","https://openalex.org/W2990666817","https://openalex.org/W2991107219","https://openalex.org/W2997987128","https://openalex.org/W3015201698","https://openalex.org/W3015605047","https://openalex.org/W3095263845","https://openalex.org/W3105645800","https://openalex.org/W3191469971","https://openalex.org/W3215562486","https://openalex.org/W4205689591","https://openalex.org/W4224871700","https://openalex.org/W4296069305","https://openalex.org/W4297841626","https://openalex.org/W4312909419","https://openalex.org/W6631190155","https://openalex.org/W6746914816","https://openalex.org/W6755207826","https://openalex.org/W6755462816","https://openalex.org/W6758080106","https://openalex.org/W6804410624","https://openalex.org/W6891861341"],"related_works":["https://openalex.org/W2073713056","https://openalex.org/W3110702597","https://openalex.org/W2078761926","https://openalex.org/W2110441383","https://openalex.org/W2125620709","https://openalex.org/W1498872724","https://openalex.org/W4233149903","https://openalex.org/W4293864700","https://openalex.org/W2524540579","https://openalex.org/W2326878701"],"abstract_inverted_index":{"Recent":[0],"research":[1],"has":[2],"shown":[3],"remarkable":[4],"performance":[5,160],"in":[6,108,161],"leveraging":[7],"multiple":[8,30],"extraneous":[9],"conditional":[10],"and":[11,86,120,154,157],"non-mutually-exclusive":[12],"semantic":[13,80],"concepts":[14,81],"for":[15,45,127],"sound":[16],"source":[17,27,48,129,139,168],"separation,":[18,49,169],"allowing":[19],"the":[20,56,73,78,117,133,162],"flexibility":[21],"to":[22,84,95,116,122],"extract":[23],"a":[24,38,65,101,123],"given":[25,66,118],"target":[26,47,67,128,155],"based":[28,50],"on":[29,51,137],"different":[31],"queries.":[32],"In":[33],"this":[34],"work,":[35],"we":[36,99],"propose":[37,100],"new":[39],"optimal":[40],"condition":[41,59,106,112],"training":[42],"(OCT)":[43],"method":[44],"single-channel":[46],"greedy":[52],"parameter":[53],"updates":[54],"using":[55],"highest":[57],"performing":[58],"among":[60],"equivalent":[61],"conditions":[62],"associated":[63],"with":[64,105,149],"source.":[68],"Our":[69],"experiments":[70,141],"show":[71],"that":[72],"complementary":[74],"information":[75],"carried":[76],"by":[77],"diverse":[79,138],"significantly":[82],"helps":[83],"disentangle":[85],"isolate":[87],"sources":[88,156],"of":[89,103,135,166],"interest":[90],"much":[91],"more":[92,124,163],"efficiently":[93],"compared":[94],"single-conditioned":[96],"models.":[97,175],"Moreover,":[98],"variation":[102],"OCT":[104,136],"refinement,":[107],"which":[109],"an":[110],"initial":[111],"vector":[113],"is":[114],"adapted":[115],"mixture":[119],"transformed":[121],"amenable":[125],"representation":[126],"extraction.":[130],"We":[131],"showcase":[132],"effectiveness":[134],"separation":[140],"where":[142],"it":[143],"improves":[144],"upon":[145],"permutation":[146],"invariant":[147],"models":[148],"oracle":[150],"assignment":[151],"between":[152],"estimated":[153],"obtains":[158],"state-of-the-art":[159],"challenging":[164],"task":[165],"text-based":[167],"outperforming":[170],"even":[171],"dedicated":[172],"text-only":[173],"conditioned":[174]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
