{"id":"https://openalex.org/W2286859569","doi":"https://doi.org/10.1109/taslp.2016.2553441","title":"Fusion Methods for Speech Enhancement and Audio Source Separation","display_name":"Fusion Methods for Speech Enhancement and Audio Source Separation","publication_year":2016,"publication_date":"2016-04-12","ids":{"openalex":"https://openalex.org/W2286859569","doi":"https://doi.org/10.1109/taslp.2016.2553441","mag":"2286859569"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2016.2553441","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2016.2553441","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003586037","display_name":"Xabier Jaureguiberry","orcid":"https://orcid.org/0000-0001-8568-2538"},"institutions":[{"id":"https://openalex.org/I12356871","display_name":"T\u00e9l\u00e9com Paris","ror":"https://ror.org/01naq7912","country_code":"FR","type":"education","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Xabier Jaureguiberry","raw_affiliation_strings":["Zenly, Paris, France","LTCI - Laboratoire Traitement et Communication de l'Information (46 rue Barrault F-75634 Paris Cedex 13 - France)","TSI - D\u00e9partement Traitement du Signal et des Images (T\u00e9l\u00e9com ParisTech / TSI 46, rue Barrault 75634 PARIS Cedex 13 - France)"],"affiliations":[{"raw_affiliation_string":"Zenly, Paris, France","institution_ids":[]},{"raw_affiliation_string":"LTCI - Laboratoire Traitement et Communication de l'Information (46 rue Barrault F-75634 Paris Cedex 13 - France)","institution_ids":["https://openalex.org/I4210165912"]},{"raw_affiliation_string":"TSI - D\u00e9partement Traitement du Signal et des Images (T\u00e9l\u00e9com ParisTech / TSI 46, rue Barrault 75634 PARIS Cedex 13 - France)","institution_ids":["https://openalex.org/I12356871"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065635001","display_name":"Emmanuel Vincent","orcid":"https://orcid.org/0000-0002-0183-7289"},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I4210127166","display_name":"Centre Inria de l'Universit\u00e9 de Lorraine","ror":"https://ror.org/03fcjvn64","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210127166"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Emmanuel Vincent","raw_affiliation_strings":["INRIA, Villers-l\u00e8s-Nancy, France","MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)"],"affiliations":[{"raw_affiliation_string":"INRIA, Villers-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210127166","https://openalex.org/I1326498283"]},{"raw_affiliation_string":"MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055423112","display_name":"Ga\u00ebl Richard","orcid":"https://orcid.org/0000-0002-4960-0010"},"institutions":[{"id":"https://openalex.org/I12356871","display_name":"T\u00e9l\u00e9com Paris","ror":"https://ror.org/01naq7912","country_code":"FR","type":"education","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Gael Richard","raw_affiliation_strings":["T\u00e9l\u00e9com ParisTech, Paris, France","LTCI - Laboratoire Traitement et Communication de l'Information (46 rue Barrault F-75634 Paris Cedex 13 - France)","TSI - D\u00e9partement Traitement du Signal et des Images (T\u00e9l\u00e9com ParisTech / TSI 46, rue Barrault 75634 PARIS Cedex 13 - France)"],"affiliations":[{"raw_affiliation_string":"T\u00e9l\u00e9com ParisTech, Paris, France","institution_ids":["https://openalex.org/I12356871"]},{"raw_affiliation_string":"LTCI - Laboratoire Traitement et Communication de l'Information (46 rue Barrault F-75634 Paris Cedex 13 - France)","institution_ids":["https://openalex.org/I4210165912"]},{"raw_affiliation_string":"TSI - D\u00e9partement Traitement du Signal et des Images (T\u00e9l\u00e9com ParisTech / TSI 46, rue Barrault 75634 PARIS Cedex 13 - France)","institution_ids":["https://openalex.org/I12356871"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003586037"],"corresponding_institution_ids":["https://openalex.org/I12356871","https://openalex.org/I4210165912"],"apc_list":null,"apc_paid":null,"fwci":4.081,"has_fulltext":false,"cited_by_count":27,"citation_normalized_percentile":{"value":0.94522076,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"24","issue":"7","first_page":"1266","last_page":"1279"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7275493144989014},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.6771688461303711},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5424178242683411},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5254266262054443},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5248296856880188},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.509566068649292},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4951612055301666},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.49184155464172363},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.4663746953010559},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46248918771743774},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.43865954875946045},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.43442660570144653},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.42540496587753296},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.41748669743537903},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.4154145121574402},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3843453526496887},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37977883219718933},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.22386667132377625},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.20640668272972107},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08909279108047485}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7275493144989014},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.6771688461303711},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5424178242683411},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5254266262054443},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5248296856880188},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.509566068649292},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4951612055301666},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.49184155464172363},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.4663746953010559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46248918771743774},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.43865954875946045},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.43442660570144653},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.42540496587753296},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.41748669743537903},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.4154145121574402},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3843453526496887},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37977883219718933},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.22386667132377625},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.20640668272972107},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08909279108047485},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2016.2553441","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2016.2553441","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-01120685v4","is_oa":false,"landing_page_url":"https://hal.science/hal-01120685","pdf_url":null,"source":{"id":"https://openalex.org/S4406922466","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Transactions on Audio, Speech and Language Processing, 2016, &#x27E8;10.1109/TASLP.2016.2553441&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W61015563","https://openalex.org/W299739017","https://openalex.org/W994258480","https://openalex.org/W1246381107","https://openalex.org/W1483336436","https://openalex.org/W1486273168","https://openalex.org/W1498436455","https://openalex.org/W1506806321","https://openalex.org/W1544106191","https://openalex.org/W1567997379","https://openalex.org/W1570770495","https://openalex.org/W1574263887","https://openalex.org/W1603903339","https://openalex.org/W1606347560","https://openalex.org/W1663973292","https://openalex.org/W1755563775","https://openalex.org/W1956364622","https://openalex.org/W1966709047","https://openalex.org/W1987906574","https://openalex.org/W1988790447","https://openalex.org/W2010575420","https://openalex.org/W2018832017","https://openalex.org/W2031696998","https://openalex.org/W2035424729","https://openalex.org/W2039844283","https://openalex.org/W2044222806","https://openalex.org/W2046869671","https://openalex.org/W2053165762","https://openalex.org/W2057193929","https://openalex.org/W2062710265","https://openalex.org/W2071467620","https://openalex.org/W2078887028","https://openalex.org/W2087774313","https://openalex.org/W2090681206","https://openalex.org/W2100824854","https://openalex.org/W2101045344","https://openalex.org/W2108849983","https://openalex.org/W2113526703","https://openalex.org/W2116244429","https://openalex.org/W2116542188","https://openalex.org/W2118522520","https://openalex.org/W2125871454","https://openalex.org/W2127851351","https://openalex.org/W2135029798","https://openalex.org/W2139807330","https://openalex.org/W2145668323","https://openalex.org/W2148575186","https://openalex.org/W2158216966","https://openalex.org/W2158275940","https://openalex.org/W2160485598","https://openalex.org/W2160815625","https://openalex.org/W2164098335","https://openalex.org/W2166209411","https://openalex.org/W2225803984","https://openalex.org/W2296573765","https://openalex.org/W2334904945","https://openalex.org/W2395107641","https://openalex.org/W2470294693","https://openalex.org/W2747655461","https://openalex.org/W2798766386","https://openalex.org/W3143596294","https://openalex.org/W4212863985","https://openalex.org/W4248437541","https://openalex.org/W4254313632","https://openalex.org/W6602473807","https://openalex.org/W6625990923","https://openalex.org/W6632676904","https://openalex.org/W6636358008","https://openalex.org/W6655093992","https://openalex.org/W6680012447","https://openalex.org/W6689152417","https://openalex.org/W6697668227","https://openalex.org/W6702735670","https://openalex.org/W6712351927","https://openalex.org/W6720558563"],"related_works":["https://openalex.org/W1509813908","https://openalex.org/W2031820693","https://openalex.org/W3024816962","https://openalex.org/W973023320","https://openalex.org/W1910172735","https://openalex.org/W2118307209","https://openalex.org/W2107364365","https://openalex.org/W2539388437","https://openalex.org/W2107688514","https://openalex.org/W2137288760"],"abstract_inverted_index":{"A":[0],"wide":[1],"variety":[2],"of":[3,52,55,84,129,136,151],"audio":[4,30],"source":[5,31,68],"separation":[6,32,57,63,78],"techniques":[7,58,79],"exist":[8],"and":[9,113],"can":[10],"already":[11],"tackle":[12],"many":[13],"challenging":[14],"industrial":[15],"issues.":[16],"However,":[17],"in":[18,29,37,59,149],"contrast":[19],"with":[20],"other":[21],"application":[22],"domains,":[23],"fusion":[24,47,85,91],"principles":[25],"were":[26],"rarely":[27],"investigated":[28],"despite":[33],"their":[34],"demonstrated":[35],"potential":[36],"classification":[38],"tasks.":[39],"In":[40],"this":[41],"paper,":[42],"we":[43],"propose":[44],"a":[45,82],"general":[46],"framework":[48],"which":[49,93],"takes":[50],"advantage":[51],"the":[53,72,120,134],"diversity":[54],"existing":[56],"order":[60],"to":[61,141,146,155],"improve":[62],"quality.":[64],"We":[65,87],"obtain":[66],"new":[67],"estimates":[69,74],"by":[70,76,81],"summing":[71],"individual":[73],"given":[75],"different":[77],"weighted":[80],"set":[83],"coefficients.":[86],"investigate":[88],"three":[89],"alternative":[90],"methods":[92,122],"are":[94],"based":[95],"on":[96],"standard":[97],"nonlinear":[98],"optimization,":[99],"Bayesian":[100],"model":[101,125,156],"averaging,":[102],"or":[103],"deep":[104,130],"neural":[105,131],"networks.":[106],"Experiments":[107],"conducted":[108],"for":[109,133],"both":[110],"speech":[111],"enhancement":[112],"singing":[114],"voice":[115],"extraction":[116],"demonstrate":[117],"that":[118],"all":[119],"proposed":[121],"outperform":[123],"traditional":[124],"selection.":[126,157],"The":[127],"use":[128],"networks":[132],"estimation":[135],"time-varying":[137],"coefficients":[138],"notably":[139],"leads":[140],"large":[142],"quality":[143],"improvements,":[144],"up":[145],"3":[147],"dB":[148],"terms":[150],"signal-to-distortion":[152],"ratio":[153],"compared":[154]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":7},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":1}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2016-06-24T00:00:00"}
