{"id":"https://openalex.org/W3016255156","doi":"https://doi.org/10.1109/icassp40776.2020.9053995","title":"A Maximum Likelihood Approach to Multi-Objective Learning Using Generalized Gaussian Distributions for Dnn-Based Speech Enhancement","display_name":"A Maximum Likelihood Approach to Multi-Objective Learning Using Generalized Gaussian Distributions for Dnn-Based Speech Enhancement","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3016255156","doi":"https://doi.org/10.1109/icassp40776.2020.9053995","mag":"3016255156"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9053995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053995","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064699619","display_name":"Shutong Niu","orcid":"https://orcid.org/0000-0003-0315-1042"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shu-Tong Niu","raw_affiliation_strings":["University of Science and Technology of China, Hefei, Anhui, P.R.China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, Anhui, P.R.China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066595711","display_name":"Jun Du","orcid":"https://orcid.org/0000-0002-2387-0389"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Du","raw_affiliation_strings":["University of Science and Technology of China, Hefei, Anhui, P.R.China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, Anhui, P.R.China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100704805","display_name":"Li Chai","orcid":"https://orcid.org/0000-0001-7906-9913"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Chai","raw_affiliation_strings":["University of Science and Technology of China, Hefei, Anhui, P.R.China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, Anhui, P.R.China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066868860","display_name":"Chin\u2010Hui Lee","orcid":"https://orcid.org/0000-0002-1892-2551"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chin-Hui Lee","raw_affiliation_strings":["Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5064699619"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.4546,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.59447005,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"2","issue":null,"first_page":"6229","last_page":"6233"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6649808883666992},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5742021799087524},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5448278784751892},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5428358316421509},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.519827663898468},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45251017808914185},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.4218378961086273},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3988092541694641},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32292497158050537},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2239997684955597},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1688184142112732},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.08715063333511353},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0621362030506134}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6649808883666992},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5742021799087524},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5448278784751892},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5428358316421509},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.519827663898468},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45251017808914185},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.4218378961086273},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3988092541694641},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32292497158050537},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2239997684955597},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1688184142112732},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.08715063333511353},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0621362030506134},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9053995","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053995","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W258661521","https://openalex.org/W1552314771","https://openalex.org/W1576996184","https://openalex.org/W1974387177","https://openalex.org/W1989364685","https://openalex.org/W1995536493","https://openalex.org/W2044893557","https://openalex.org/W2069681747","https://openalex.org/W2078528584","https://openalex.org/W2110641918","https://openalex.org/W2121973264","https://openalex.org/W2141998673","https://openalex.org/W2397226255","https://openalex.org/W2516342150","https://openalex.org/W2791874741","https://openalex.org/W2910788588","https://openalex.org/W2920582663","https://openalex.org/W2936028438","https://openalex.org/W2937484199","https://openalex.org/W2944686050","https://openalex.org/W2950258612","https://openalex.org/W2963351212","https://openalex.org/W2969917057","https://openalex.org/W6609686331","https://openalex.org/W6712317276"],"related_works":["https://openalex.org/W1630865680","https://openalex.org/W2373767407","https://openalex.org/W3168109306","https://openalex.org/W2056031932","https://openalex.org/W3096184950","https://openalex.org/W4231424160","https://openalex.org/W2275432853","https://openalex.org/W197907117","https://openalex.org/W1964286703","https://openalex.org/W2169866437"],"abstract_inverted_index":{"The":[0,90,157],"multi-objective":[1,67],"learning":[2,68],"using":[3],"minimum":[4],"mean":[5],"squared":[6],"error":[7,34,85,105,117],"criterion":[8],"for":[9,69],"DNN-based":[10,70],"speech":[11,71],"enhancement":[12,72],"(MMSE-MOL-DNN)":[13],"has":[14],"been":[15],"demonstrated":[16],"to":[17,65,74,94,135],"achieve":[18,75,165],"better":[19,166],"performance":[20,167],"than":[21,168],"single":[22],"output":[23],"DNN.":[24],"However,":[25],"one":[26],"problem":[27],"of":[28,79,83,110,114,154,172],"MMSE-MOL-DNN":[29,169],"is":[30,97,122],"that":[31,161],"the":[32,55,66,76,80,100,108,111,115,125,137,142,146],"prediction":[33,84,116],"values":[35,86,118],"on":[36,87,119],"different":[37,88,120,173],"targets":[38,121],"have":[39],"a":[40,133],"very":[41],"broad":[42],"dynamic":[43,81,112],"range,":[44],"causing":[45],"difficulty":[46],"in":[47,60,128,151,170],"DNN":[48],"training.":[49],"In":[50],"this":[51],"paper,":[52],"we":[53,131],"extend":[54],"maximum":[56],"likelihood":[57,92],"approach":[58],"proposed":[59],"our":[61,162],"previous":[62],"work":[63],"[1]":[64],"(ML-MOL-DNN)":[73],"automatic":[77],"adjustment":[78],"range":[82,113],"targets.":[89],"conditional":[91],"function":[93],"be":[95],"maximized":[96],"derived":[98],"under":[99],"generalized":[101],"Gaussian":[102],"distribution":[103],"(GGD)":[104],"model.":[106],"Moreover,":[107],"control":[109],"achieved":[123],"by":[124],"scale":[126],"factors":[127,139],"GGD.":[129],"Furthermore,":[130],"propose":[132],"method":[134],"update":[136],"shape":[138,149],"automatically":[140],"utilizing":[141],"one-to-one":[143],"mapping":[144],"between":[145],"kurtosis":[147],"and":[148],"factor":[150],"GGD":[152],"instead":[153],"manual":[155],"adjustment.":[156],"experimental":[158],"results":[159],"show":[160],"ML-MOL-DNN":[163],"can":[164],"terms":[171],"objective":[174],"measures.":[175]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
