{"id":"https://openalex.org/W2891508564","doi":"https://doi.org/10.1109/taslp.2018.2869692","title":"Gaussian Modeling-Based Multichannel Audio Source Separation Exploiting Generic Source Spectral Model","display_name":"Gaussian Modeling-Based Multichannel Audio Source Separation Exploiting Generic Source Spectral Model","publication_year":2018,"publication_date":"2018-09-12","ids":{"openalex":"https://openalex.org/W2891508564","doi":"https://doi.org/10.1109/taslp.2018.2869692","mag":"2891508564"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2018.2869692","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2869692","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-02045480","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003217635","display_name":"Thanh Thi Duong","orcid":"https://orcid.org/0000-0001-5854-5845"},"institutions":[{"id":"https://openalex.org/I29199639","display_name":"Hanoi University of Mining and Geology","ror":"https://ror.org/01rw3qm79","country_code":"VN","type":"education","lineage":["https://openalex.org/I29199639"]},{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Thanh Thi Hien Duong","raw_affiliation_strings":["Hanoi University of Mining and Geology, Hanoi, VN","MICA - International Research Institute MICA (B1-Hanoi University of Science and technology (Truong Dai Hoc Bach Khoa) 1 Dai Co Viet - Hai Ba Trung Hanoi - Vietnam - Vietnam)"],"raw_orcid":"https://orcid.org/0000-0001-5854-5845","affiliations":[{"raw_affiliation_string":"Hanoi University of Mining and Geology, Hanoi, VN","institution_ids":["https://openalex.org/I29199639"]},{"raw_affiliation_string":"MICA - International Research Institute MICA (B1-Hanoi University of Science and technology (Truong Dai Hoc Bach Khoa) 1 Dai Co Viet - Hai Ba Trung Hanoi - Vietnam - Vietnam)","institution_ids":["https://openalex.org/I94518387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041584595","display_name":"Ngoc Q. K. Duong","orcid":"https://orcid.org/0000-0002-7627-8194"},"institutions":[{"id":"https://openalex.org/I2929663463","display_name":"Technicolor (Germany)","ror":"https://ror.org/00besvm65","country_code":"DE","type":"company","lineage":["https://openalex.org/I2929663463","https://openalex.org/I4210121266"]},{"id":"https://openalex.org/I4210121266","display_name":"Technicolor (France)","ror":"https://ror.org/02ya5n776","country_code":"FR","type":"company","lineage":["https://openalex.org/I4210121266"]}],"countries":["DE","FR"],"is_corresponding":false,"raw_author_name":"Ngoc Q. K. Duong","raw_affiliation_strings":["Technicolor R&D, Rennes, France","Technicolor (France)"],"raw_orcid":"https://orcid.org/0000-0002-7627-8194","affiliations":[{"raw_affiliation_string":"Technicolor R&D, Rennes, France","institution_ids":["https://openalex.org/I2929663463"]},{"raw_affiliation_string":"Technicolor (France)","institution_ids":["https://openalex.org/I4210121266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041935140","display_name":"Phuong Cong Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Phuong Cong Nguyen","raw_affiliation_strings":["HUST - Hanoi University of Science and Technology (Institut polytechnique de Hanoi, \r\n1 Dai Co Viet Road, Ha Noi - Vietnam)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"HUST - Hanoi University of Science and Technology (Institut polytechnique de Hanoi, \r\n1 Dai Co Viet Road, Ha Noi - Vietnam)","institution_ids":["https://openalex.org/I94518387"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101764507","display_name":"Quoc Cuong Nguyen","orcid":"https://orcid.org/0000-0002-5641-5040"},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Cuong Quoc Nguyen","raw_affiliation_strings":["HUST - Hanoi University of Science and Technology (Institut polytechnique de Hanoi, \r\n1 Dai Co Viet Road, Ha Noi - Vietnam)"],"raw_orcid":"https://orcid.org/0000-0002-5362-2968","affiliations":[{"raw_affiliation_string":"HUST - Hanoi University of Science and Technology (Institut polytechnique de Hanoi, \r\n1 Dai Co Viet Road, Ha Noi - Vietnam)","institution_ids":["https://openalex.org/I94518387"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5003217635"],"corresponding_institution_ids":["https://openalex.org/I29199639","https://openalex.org/I94518387"],"apc_list":null,"apc_paid":null,"fwci":0.8281,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.73911062,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"27","issue":"1","first_page":"32","last_page":"43"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.7638799548149109},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.6482743620872498},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6353319883346558},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.49802112579345703},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.49382147192955017},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.47988998889923096},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.47858166694641113},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.42799967527389526},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4200451672077179},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.362490177154541},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32891392707824707},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.24725788831710815}],"concepts":[{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.7638799548149109},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.6482743620872498},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6353319883346558},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.49802112579345703},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.49382147192955017},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.47988998889923096},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.47858166694641113},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.42799967527389526},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4200451672077179},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.362490177154541},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32891392707824707},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.24725788831710815},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2018.2869692","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2869692","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-02045480v1","is_oa":true,"landing_page_url":"https://hal.science/hal-02045480","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech and Language Processing, 2019, 27 (1), pp.32-43. &#x27E8;10.1109/TASLP.2018.2869692&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-02045480v1","is_oa":true,"landing_page_url":"https://hal.science/hal-02045480","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech and Language Processing, 2019, 27 (1), pp.32-43. &#x27E8;10.1109/TASLP.2018.2869692&#x27E9;","raw_type":"Journal articles"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":84,"referenced_works":["https://openalex.org/W76597279","https://openalex.org/W147600081","https://openalex.org/W285277413","https://openalex.org/W1518853429","https://openalex.org/W1594771616","https://openalex.org/W1790748249","https://openalex.org/W1842657353","https://openalex.org/W1956364622","https://openalex.org/W1965581401","https://openalex.org/W1969952034","https://openalex.org/W1974186229","https://openalex.org/W1981755271","https://openalex.org/W2001987918","https://openalex.org/W2006590639","https://openalex.org/W2012910847","https://openalex.org/W2017548439","https://openalex.org/W2021196544","https://openalex.org/W2031583051","https://openalex.org/W2039844283","https://openalex.org/W2043095867","https://openalex.org/W2046233597","https://openalex.org/W2049633694","https://openalex.org/W2055401280","https://openalex.org/W2069884666","https://openalex.org/W2082444737","https://openalex.org/W2098101267","https://openalex.org/W2105921478","https://openalex.org/W2113154266","https://openalex.org/W2113990625","https://openalex.org/W2114508388","https://openalex.org/W2117332620","https://openalex.org/W2127851351","https://openalex.org/W2129171989","https://openalex.org/W2135029798","https://openalex.org/W2143027228","https://openalex.org/W2143513973","https://openalex.org/W2149368536","https://openalex.org/W2150415460","https://openalex.org/W2158216966","https://openalex.org/W2159310722","https://openalex.org/W2221409856","https://openalex.org/W2285479626","https://openalex.org/W2408744528","https://openalex.org/W2412956798","https://openalex.org/W2522083103","https://openalex.org/W2549452274","https://openalex.org/W2568308529","https://openalex.org/W2575498233","https://openalex.org/W2580692915","https://openalex.org/W2607108972","https://openalex.org/W2644497536","https://openalex.org/W2806198829","https://openalex.org/W2892163332","https://openalex.org/W2916583660","https://openalex.org/W2916985722","https://openalex.org/W2917831833","https://openalex.org/W2964010042","https://openalex.org/W3124794156","https://openalex.org/W3143596294","https://openalex.org/W6605949115","https://openalex.org/W6631184795","https://openalex.org/W6635652743","https://openalex.org/W6638545978","https://openalex.org/W6640823206","https://openalex.org/W6641352206","https://openalex.org/W6642573306","https://openalex.org/W6643824070","https://openalex.org/W6650663758","https://openalex.org/W6652268800","https://openalex.org/W6653298445","https://openalex.org/W6675183262","https://openalex.org/W6677083428","https://openalex.org/W6680012447","https://openalex.org/W6681200271","https://openalex.org/W6683414387","https://openalex.org/W6688843265","https://openalex.org/W6695735281","https://openalex.org/W6726818740","https://openalex.org/W6732714863","https://openalex.org/W6739510395","https://openalex.org/W6752415752","https://openalex.org/W6754904195","https://openalex.org/W6759212570","https://openalex.org/W6759591289"],"related_works":["https://openalex.org/W2037504162","https://openalex.org/W2774154397","https://openalex.org/W2146544734","https://openalex.org/W1979654135","https://openalex.org/W2156699640","https://openalex.org/W2098101267","https://openalex.org/W2156181515","https://openalex.org/W2158112352","https://openalex.org/W2081322759","https://openalex.org/W1984255382"],"abstract_inverted_index":{"As":[0],"<italic":[1,25,39],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[2,26,40],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">blind</i>":[3],"audio":[4,55],"source":[5,32,70,80,109,128,154,170],"separation":[6,71,165,176],"has":[7],"remained":[8],"very":[9],"challenging":[10],"in":[11,62,111],"real-world":[12],"scenarios,":[13],"some":[14],"existing":[15],"works,":[16],"including":[17],"ours,":[18],"have":[19],"investigated":[20],"the":[21,74,79,92,98,104,107,117,123,135,147,158,169,174,190,199],"use":[22,118],"of":[23,106,119,126,138,189],"a":[24,68,85,153,194],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">weakly":[27],"informed</i>":[28],"approach":[29,50,72,192],"where":[30,73],"generic":[31],"spectral":[33],"models":[34],"(GSSM)":[35],"can":[36,149],"be":[37,60,150],"learned":[38],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">a":[41],"priori</i>":[42],"based":[43],"on":[44],"nonnegative":[45],"matrix":[46],"factorization":[47],"(NMF).":[48],"Such":[49],"was":[51],"derived":[52],"for":[53,97,102],"single-channel":[54],"mixtures":[56],"and":[57,133,182],"shown":[58],"to":[59,168,186],"efficient":[61],"different":[63],"settings.":[64],"This":[65],"paper":[66],"proposes":[67],"multichannel":[69],"GSSM":[75],"is":[76,160],"combined":[77],"with":[78,179,184],"spatial":[81],"covariance":[82],"model":[83],"within":[84,198],"unified":[86],"Gaussian":[87],"modeling":[88],"framework.":[89],"We":[90,172],"present":[91],"generalized":[93],"expectation-minimization":[94],"(EM)":[95],"algorithm":[96],"para-meter":[99],"estimation.":[100],"Especially,":[101],"guiding":[103],"estimation":[105],"intermediate":[108],"variances":[110,125,137],"each":[112,127],"EM":[113],"iteration,":[114],"we":[115],"investigate":[116],"two":[120],"criteria:":[121],"First,":[122],"estimated":[124],"are":[129,141],"constrained":[130,142],"by":[131,143],"NMF,":[132],"finally,":[134],"total":[136],"all":[139],"sources":[140],"NMF":[144],"altogether.":[145],"While":[146],"former":[148],"seen":[151],"as":[152,162],"variance":[155],"denoising":[156],"step,":[157],"latter":[159],"viewed":[161],"an":[163],"additional":[164],"step":[166],"applied":[167],"variance.":[171],"demonstrate":[173],"speech":[175],"performance,":[177],"together":[178],"its":[180],"convergence":[181],"stability":[183],"respect":[185],"parameter":[187],"setting,":[188],"proposed":[191],"using":[193],"benchmark":[195],"dataset":[196],"provided":[197],"2016":[200],"Signal":[201],"Separation":[202],"Evaluation":[203],"Campaign.":[204]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
