{"id":"https://openalex.org/W2133221761","doi":"https://doi.org/10.1109/tasl.2008.2012319","title":"Cepstrum-Domain Model Combination Based on Decomposition of Speech and Noise Using MMSE-LSA for ASR in Noisy Environments","display_name":"Cepstrum-Domain Model Combination Based on Decomposition of Speech and Noise Using MMSE-LSA for ASR in Noisy Environments","publication_year":2009,"publication_date":"2009-03-30","ids":{"openalex":"https://openalex.org/W2133221761","doi":"https://doi.org/10.1109/tasl.2008.2012319","mag":"2133221761"},"language":"en","primary_location":{"id":"doi:10.1109/tasl.2008.2012319","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2008.2012319","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085604883","display_name":"Hong Kook Kim","orcid":"https://orcid.org/0000-0002-0105-6693"},"institutions":[{"id":"https://openalex.org/I39534123","display_name":"Gwangju Institute of Science and Technology","ror":"https://ror.org/024kbgz78","country_code":"KR","type":"education","lineage":["https://openalex.org/I39534123"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Hong Kook Kim","raw_affiliation_strings":["Department of Information and Communications, Gwangju Institute of Science and Technology, Gwangju, South Korea","Dept. of Inf. & Commun., Gwangju Inst. of Sci. & Technol., Gwangju#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Information and Communications, Gwangju Institute of Science and Technology, Gwangju, South Korea","institution_ids":["https://openalex.org/I39534123"]},{"raw_affiliation_string":"Dept. of Inf. & Commun., Gwangju Inst. of Sci. & Technol., Gwangju#TAB#","institution_ids":["https://openalex.org/I39534123"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077077136","display_name":"Richard C. Rose","orcid":null},"institutions":[{"id":"https://openalex.org/I5023651","display_name":"McGill University","ror":"https://ror.org/01pxwe438","country_code":"CA","type":"education","lineage":["https://openalex.org/I5023651"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Richard C. Rose","raw_affiliation_strings":["Department of Electrical and Computer Engineering, McGill University, Montreal, QUE, Canada","[Dept. of Electr. & Comput. Eng., McGill Univ., Montreal, QC]"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, McGill University, Montreal, QUE, Canada","institution_ids":["https://openalex.org/I5023651"]},{"raw_affiliation_string":"[Dept. of Electr. & Comput. Eng., McGill Univ., Montreal, QC]","institution_ids":["https://openalex.org/I5023651"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5085604883"],"corresponding_institution_ids":["https://openalex.org/I39534123"],"apc_list":null,"apc_paid":null,"fwci":0.7049,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.70078474,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"17","issue":"4","first_page":"704","last_page":"713"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.9386148452758789},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7066170573234558},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.6942068934440613},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6739494800567627},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44498491287231445},{"id":"https://openalex.org/keywords/time-domain","display_name":"Time domain","score":0.43823832273483276},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.4371494650840759},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.4348505437374115},{"id":"https://openalex.org/keywords/minimum-mean-square-error","display_name":"Minimum mean square error","score":0.4167175889015198},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.41326141357421875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3715812563896179},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.24477019906044006},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2387983500957489},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.17142146825790405},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13557204604148865}],"concepts":[{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.9386148452758789},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7066170573234558},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.6942068934440613},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6739494800567627},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44498491287231445},{"id":"https://openalex.org/C103824480","wikidata":"https://www.wikidata.org/wiki/Q185889","display_name":"Time domain","level":2,"score":0.43823832273483276},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.4371494650840759},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.4348505437374115},{"id":"https://openalex.org/C90652560","wikidata":"https://www.wikidata.org/wiki/Q11091747","display_name":"Minimum mean square error","level":3,"score":0.4167175889015198},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.41326141357421875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3715812563896179},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.24477019906044006},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2387983500957489},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.17142146825790405},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13557204604148865},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tasl.2008.2012319","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2008.2012319","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8100000023841858,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W79317937","https://openalex.org/W174003511","https://openalex.org/W1614028504","https://openalex.org/W1920183217","https://openalex.org/W1952003395","https://openalex.org/W2045036776","https://openalex.org/W2050693797","https://openalex.org/W2051970538","https://openalex.org/W2059736174","https://openalex.org/W2076979746","https://openalex.org/W2103290541","https://openalex.org/W2110075857","https://openalex.org/W2114548037","https://openalex.org/W2121894251","https://openalex.org/W2121973264","https://openalex.org/W2124611315","https://openalex.org/W2126597753","https://openalex.org/W2128402994","https://openalex.org/W2136586452","https://openalex.org/W2139002649","https://openalex.org/W2146064606","https://openalex.org/W2146871184","https://openalex.org/W2150660184","https://openalex.org/W2151484683","https://openalex.org/W2152131029","https://openalex.org/W2158336491","https://openalex.org/W2160806989","https://openalex.org/W2161151281","https://openalex.org/W2168362601","https://openalex.org/W3147539069","https://openalex.org/W6603280604","https://openalex.org/W6680471220","https://openalex.org/W6682194319"],"related_works":["https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W2373675101","https://openalex.org/W4385672897","https://openalex.org/W106160982","https://openalex.org/W2359140082","https://openalex.org/W2074132948","https://openalex.org/W2160511961","https://openalex.org/W2361247493"],"abstract_inverted_index":{"This":[0,21,86],"paper":[1,233],"presents":[2],"an":[3],"efficient":[4,91],"method":[5,22,87,132,158],"for":[6,13],"combining":[7,174],"models":[8,142],"of":[9,28,69,152,166,239,244],"speech":[10,15,30,33,73,175],"and":[11,35,75,143,176,181,196,225,248],"noise":[12,37,77,84,118,141,178,223],"robust":[14],"recognition":[16,51,188],"applications":[17],"in":[18,105,111,127],"noisy":[19,56],"environments.":[20],"decomposes":[23],"the":[24,106,112,153,206,237],"cepstrum":[25,34,38,57,70,107],"domain":[26,58,71,108],"representation":[27],"noise-corrupted":[29],"into":[31],"clean":[32,72],"background":[36,76,117,140,177,222],"components":[39],"using":[40,60,80],"a":[41,61,124,135,162,170,184,200,212,242],"minimum":[42],"mean":[43],"squared":[44],"error-log":[45],"spectral":[46,114],"amplitude":[47],"(MMSE-LSA)":[48],"criterion.":[49],"Speech":[50],"is":[52,64,88,102,121,159,191,203,217],"then":[53],"performed":[54,103],"on":[55,183],"observations":[59],"model":[62,95,100,119,156,179,208,249],"that":[63,205,216],"formed":[65],"by":[66],"parallel":[67,94],"combination":[68,96,101,157,209,243,250],"distributions":[74,78],"estimated":[79],"this":[81,131,254],"MMSE-LSA":[82],"based":[83],"decomposition.":[85],"far":[89],"more":[90],"than":[92,110],"other":[93],"(PMC)":[97],"procedures":[98],"because":[99],"directly":[104],"rather":[109],"linear":[113],"domain.":[115],"Whereas":[116],"estimation":[120],"addressed":[122],"as":[123],"separate":[125],"issue":[126],"existing":[128],"PMC":[129,167,220],"procedures,":[130],"explicitly":[133],"incorporates":[134],"mechanism":[136],"to":[137,193,219,230,253],"continually":[138],"update":[139],"signal-to-noise":[144],"ratio":[145],"(SNR)":[146],"estimates":[147],"over":[148],"time.":[149],"The":[150,232],"performance":[151],"proposed":[154,207],"cepstrum-domain":[155,245],"compared":[160],"with":[161],"well":[163],"known":[164,228],"implementation":[165],"which":[168,190],"uses":[169],"log-normal":[171],"approximation":[172],"when":[173,221],"means":[180],"variances":[182],"connected":[185],"digit":[186],"string":[187],"task":[189],"subjected":[192],"mismatched":[194],"channel":[195],"environment":[197],"conditions.":[198],"As":[199],"result,":[201],"it":[202],"shown":[204],"technique":[210],"gives":[211],"word":[213],"error":[214],"rate":[215],"comparable":[218],"information":[224],"SNR":[226],"are":[227,251],"prior":[229],"estimation.":[231],"will":[234],"also":[235],"present":[236],"results":[238],"experiments":[240],"where":[241],"feature":[246],"compensation":[247],"applied":[252],"task.":[255]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
