{"id":"https://openalex.org/W2008709751","doi":"https://doi.org/10.1109/chinasip.2014.6889236","title":"Enhanced power-normalized features for mandarin robust speech recognition based on a voiced-unvoiced-silence decision","display_name":"Enhanced power-normalized features for mandarin robust speech recognition based on a voiced-unvoiced-silence decision","publication_year":2014,"publication_date":"2014-07-01","ids":{"openalex":"https://openalex.org/W2008709751","doi":"https://doi.org/10.1109/chinasip.2014.6889236","mag":"2008709751"},"language":"en","primary_location":{"id":"doi:10.1109/chinasip.2014.6889236","is_oa":false,"landing_page_url":"https://doi.org/10.1109/chinasip.2014.6889236","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE China Summit &amp; International Conference on Signal and Information Processing (ChinaSIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011663086","display_name":"Ying-Wei Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ying-Wei Tan","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039635290","display_name":"Wenju Liu","orcid":"https://orcid.org/0000-0001-9088-8282"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen-Ju Liu","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084649692","display_name":"Zhanlei Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhan-Lei Yang","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100429432","display_name":"Mingming Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming-Ming Chen","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Nat. Lab. of Pattern Recognition, Inst. of Autom., Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5011663086"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210094879","https://openalex.org/I4210112150"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.08362269,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"495","issue":null,"first_page":"222","last_page":"226"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.8771087527275085},{"id":"https://openalex.org/keywords/silence","display_name":"Silence","score":0.8228920698165894},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.8062359094619751},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7185837626457214},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.4924486577510834},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.4827508330345154},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.43400442600250244},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.363651305437088},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3524513840675354},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.14024734497070312},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.09567281603813171}],"concepts":[{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.8771087527275085},{"id":"https://openalex.org/C2781115785","wikidata":"https://www.wikidata.org/wiki/Q502261","display_name":"Silence","level":2,"score":0.8228920698165894},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.8062359094619751},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7185837626457214},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.4924486577510834},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.4827508330345154},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.43400442600250244},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.363651305437088},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3524513840675354},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.14024734497070312},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.09567281603813171},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/chinasip.2014.6889236","is_oa":false,"landing_page_url":"https://doi.org/10.1109/chinasip.2014.6889236","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE China Summit &amp; International Conference on Signal and Information Processing (ChinaSIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.75,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1489183891","https://openalex.org/W1557725510","https://openalex.org/W1974387177","https://openalex.org/W1992272902","https://openalex.org/W2017159651","https://openalex.org/W2030937226","https://openalex.org/W2042211079","https://openalex.org/W2045036776","https://openalex.org/W2114719288","https://openalex.org/W2115717467","https://openalex.org/W2126597753","https://openalex.org/W2151484683","https://openalex.org/W2396358341","https://openalex.org/W2401185733","https://openalex.org/W2518699868","https://openalex.org/W4285719527","https://openalex.org/W6654595128"],"related_works":["https://openalex.org/W2008709751","https://openalex.org/W2120827176","https://openalex.org/W3163132306","https://openalex.org/W2098913653","https://openalex.org/W6852854","https://openalex.org/W2314298589","https://openalex.org/W2397855697","https://openalex.org/W4312095922","https://openalex.org/W2143864059","https://openalex.org/W2368779261"],"abstract_inverted_index":{"Power-normalized":[0],"features":[1,109],"have":[2],"been":[3],"shown":[4],"to":[5,33,58,114],"improve":[6],"the":[7,61,67,84,101,135],"performance":[8],"of":[9,26,43,69],"English":[10],"large":[11],"vocabulary":[12],"continuous":[13,128],"speech":[14,129],"recognition":[15,124,130],"under":[16],"different":[17,31,36],"acoustic":[18],"conditions.":[19],"In":[20],"this":[21],"paper,":[22],"considering":[23],"tone":[24],"characteristics":[25],"Mandarin":[27,117,127],"speech,":[28],"we":[29],"adopt":[30],"strategies":[32],"deal":[34],"with":[35],"sounds":[37],"based":[38,50],"on":[39,51],"a":[40,52,105],"voiced-unvoiced-silence":[41],"decision":[42],"sounds.":[44],"For":[45,81,89],"voiced":[46],"sounds,":[47,83,91],"harmonic":[48,63],"enhancement":[49],"weighted":[53],"harmonic-noise-model":[54],"(WHNM)":[55],"is":[56,79,86,98],"applied":[57],"accurately":[59],"capture":[60],"salient":[62],"information":[64],"and":[65,112],"decreases":[66],"effect":[68],"various":[70],"non-stationary":[71],"noises.":[72],"After":[73],"this,":[74],"standard":[75],"power-normalized":[76,108],"processing":[77],"(SPNP)":[78],"performed.":[80],"unvoiced":[82],"SPNP":[85],"only":[87],"used.":[88],"silence":[90],"an":[92],"quality":[93],"frame":[94],"dropping":[95],"(FD)":[96],"algorithm":[97],"incorporated":[99],"into":[100],"front-end":[102],"properly.":[103],"As":[104],"result,":[106],"enhanced":[107],"are":[110],"obtained":[111],"used":[113],"process":[115],"noise-corrupted":[116],"speech.":[118],"The":[119],"experimental":[120],"results":[121],"show":[122],"better":[123],"accuracies":[125],"for":[126],"in":[131],"noisy":[132],"environments":[133],"over":[134],"ETSI":[136],"Advanced":[137],"Front-End":[138],"(AFE).":[139]},"counts_by_year":[{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
