{"id":"https://openalex.org/W2116842019","doi":"https://doi.org/10.1109/icassp.2014.6853596","title":"Natural speech synthesis based on hybrid approach with candidate expansion and verification","display_name":"Natural speech synthesis based on hybrid approach with candidate expansion and verification","publication_year":2014,"publication_date":"2014-05-01","ids":{"openalex":"https://openalex.org/W2116842019","doi":"https://doi.org/10.1109/icassp.2014.6853596","mag":"2116842019"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2014.6853596","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6853596","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103251327","display_name":"Chung\u2010Hsien Wu","orcid":"https://orcid.org/0000-0002-3947-2123"},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Hsien Wu","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan, R.O.C","Department of Computer Science and Information Engineering, National Cheng Kung University , Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan, R.O.C","institution_ids":["https://openalex.org/I91807558"]},{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University , Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101059668","display_name":"Yi-Chin Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yi-Chin Huang","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan, R.O.C","Department of Computer Science and Information Engineering, National Cheng Kung University , Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan, R.O.C","institution_ids":["https://openalex.org/I91807558"]},{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University , Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027643159","display_name":"Shih-Lun Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shih-Lun Lin","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan, R.O.C","Department of Computer Science and Information Engineering, National Cheng Kung University , Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan, R.O.C","institution_ids":["https://openalex.org/I91807558"]},{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University , Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004459028","display_name":"Chia-Ping Chen","orcid":"https://orcid.org/0000-0002-0151-2556"},"institutions":[{"id":"https://openalex.org/I142974352","display_name":"National Sun Yat-sen University","ror":"https://ror.org/00mjawt10","country_code":"TW","type":"education","lineage":["https://openalex.org/I142974352"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chia-Ping Chen","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Sun Yat-Sen University, Taiwan, R.O.C","Department of Computer Science and Information Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Sun Yat-Sen University, Taiwan, R.O.C","institution_ids":["https://openalex.org/I142974352"]},{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Sun Yat-sen University, Kaohsiung, Taiwan","institution_ids":["https://openalex.org/I142974352"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8458,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.82132382,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"21","issue":null,"first_page":"250","last_page":"254"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9789999723434448,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7898072600364685},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.6782222986221313},{"id":"https://openalex.org/keywords/naturalness","display_name":"Naturalness","score":0.6711968183517456},{"id":"https://openalex.org/keywords/concatenation","display_name":"Concatenation (mathematics)","score":0.6696773171424866},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6690407395362854},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.4962769150733948},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.45378395915031433},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4026327133178711},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35059550404548645},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12339642643928528}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7898072600364685},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.6782222986221313},{"id":"https://openalex.org/C134537474","wikidata":"https://www.wikidata.org/wiki/Q17144832","display_name":"Naturalness","level":2,"score":0.6711968183517456},{"id":"https://openalex.org/C87619178","wikidata":"https://www.wikidata.org/wiki/Q126002","display_name":"Concatenation (mathematics)","level":2,"score":0.6696773171424866},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6690407395362854},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.4962769150733948},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.45378395915031433},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4026327133178711},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35059550404548645},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12339642643928528},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2014.6853596","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6853596","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6899999976158142,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W3629425","https://openalex.org/W344150399","https://openalex.org/W1524014603","https://openalex.org/W2004687614","https://openalex.org/W2039241583","https://openalex.org/W2066186361","https://openalex.org/W2137718131","https://openalex.org/W2139525902","https://openalex.org/W2149572519","https://openalex.org/W2161135987","https://openalex.org/W2162295204","https://openalex.org/W2165848216","https://openalex.org/W2365209858","https://openalex.org/W2395647737","https://openalex.org/W2579024677","https://openalex.org/W3142087749","https://openalex.org/W6600138404","https://openalex.org/W6611766843","https://openalex.org/W6631509255","https://openalex.org/W6711853402","https://openalex.org/W6732412368","https://openalex.org/W7025091378"],"related_works":["https://openalex.org/W234770729","https://openalex.org/W4391272374","https://openalex.org/W2588431733","https://openalex.org/W2391796527","https://openalex.org/W1914543332","https://openalex.org/W2387179309","https://openalex.org/W2946856121","https://openalex.org/W40885451","https://openalex.org/W2388979876","https://openalex.org/W4245668640"],"abstract_inverted_index":{"A":[0],"hybrid":[1,143],"Mandarin":[2],"speech":[3,123],"synthesis":[4],"system":[5],"combining":[6],"concatenation-based":[7],"and":[8,89,126,140,162],"model-based":[9,118],"methodology":[10],"is":[11,49,70,96,166],"investigated":[12],"in":[13,168],"this":[14],"research.":[15],"To":[16],"effectively":[17],"exploit":[18],"a":[19,52,76],"small-size":[20],"corpus,":[21],"the":[22,41,73,82,100,103,111,134,137,141,163,170,173],"candidate":[23,148],"sets":[24],"for":[25,121,160],"unit":[26,68],"selection":[27],"are":[28,38,115],"expanded":[29],"via":[30],"clusters":[31],"based":[32,151],"on":[33,81,152],"articulatory":[34,86,153],"features":[35,154],"(AF),":[36],"which":[37,79],"estimated":[39],"as":[40],"outputs":[42],"of":[43,75,102,172],"an":[44,63,66],"artificial":[45],"neural":[46],"network.":[47],"This":[48],"followed":[50],"by":[51,72,117],"filtering":[53],"operation":[54],"incorporating":[55],"residual":[56],"compensation,":[57],"to":[58,98,109,156],"remove":[59],"unsuitable":[60],"units.":[61],"Given":[62],"input":[64],"text,":[65],"optimal":[67],"sequence":[69],"decided":[71],"minimization":[74],"total":[77],"cost,":[78],"depends":[80],"spectral":[83],"features,":[84,87],"contextual":[85],"formants,":[88],"pitch":[90],"values.":[91],"Furthermore,":[92],"prosodic":[93,112],"word":[94,113],"verification":[95,114,164],"integrated":[97],"check":[99],"smoothness":[101],"output":[104,174],"speech.":[105,175],"The":[106],"units":[107,120,158],"failing":[108],"pass":[110],"replaced":[116],"synthesized":[119],"better":[122],"quality.":[124],"Objective":[125],"subjective":[127],"evaluations":[128],"have":[129],"been":[130],"conducted.":[131],"Comparisons":[132],"among":[133],"proposed":[135],"method,":[136,139],"HMM-based":[138],"conventional":[142],"method":[144],"clearly":[145],"show":[146],"that":[147],"set":[149],"expansion":[150],"lead":[155],"more":[157],"suitable":[159],"selection,":[161],"process":[165],"effective":[167],"improving":[169],"naturalness":[171]},"counts_by_year":[{"year":2016,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
