{"id":"https://openalex.org/W2096195361","doi":"https://doi.org/10.1109/chinsl.2004.1409615","title":"A superposed prosodic model for Chinese text-to-speech synthesis","display_name":"A superposed prosodic model for Chinese text-to-speech synthesis","publication_year":2005,"publication_date":"2005-04-06","ids":{"openalex":"https://openalex.org/W2096195361","doi":"https://doi.org/10.1109/chinsl.2004.1409615","mag":"2096195361"},"language":"en","primary_location":{"id":"doi:10.1109/chinsl.2004.1409615","is_oa":false,"landing_page_url":"https://doi.org/10.1109/chinsl.2004.1409615","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SympoTIC '04. Joint 1st Workshop on Mobile Future &amp; Symposium on Trends In Communications (IEEE Cat. No.04EX877)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108533915","display_name":"Gao-Peng Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gao-Peng Chen","raw_affiliation_strings":["Iflvtek Speech Lab, University of Science & Technology of China","Iflytek Speech Laboratory, University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Iflvtek Speech Lab, University of Science & Technology of China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Iflytek Speech Laboratory, University of Science and Technology, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071432574","display_name":"G\u00e9rard Bailly","orcid":"https://orcid.org/0000-0002-6053-0818"},"institutions":[{"id":"https://openalex.org/I4210089785","display_name":"Institut des sciences de la communication","ror":"https://ror.org/00801j392","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I39804081","https://openalex.org/I4210089785","https://openalex.org/I4210127448","https://openalex.org/I4210139971"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"G. Bailly","raw_affiliation_strings":["Institut de la Communication Parlee, CNRS/INPG/U3"],"affiliations":[{"raw_affiliation_string":"Institut de la Communication Parlee, CNRS/INPG/U3","institution_ids":["https://openalex.org/I4210089785"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039181878","display_name":"Qingfeng Liu","orcid":"https://orcid.org/0000-0001-5437-4946"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing-Feng Liu","raw_affiliation_strings":["Iflvtek Speech Lab, University of Science & Technology of China","Iflytek Speech Laboratory, University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Iflvtek Speech Lab, University of Science & Technology of China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Iflytek Speech Laboratory, University of Science and Technology, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045299550","display_name":"Ren-Hua Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ren-Hua Wang","raw_affiliation_strings":["Iflvtek Speech Lab, University of Science & Technology of China","Iflytek Speech Laboratory, University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Iflvtek Speech Lab, University of Science & Technology of China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Iflytek Speech Laboratory, University of Science and Technology, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5108533915"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":2.6325,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.90698471,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"177","last_page":"180"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prosody","display_name":"Prosody","score":0.8119261860847473},{"id":"https://openalex.org/keywords/concatenation","display_name":"Concatenation (mathematics)","score":0.7008876204490662},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6906444430351257},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6864492893218994},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5747570395469666},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.571996808052063},{"id":"https://openalex.org/keywords/stress","display_name":"Stress (linguistics)","score":0.550653874874115},{"id":"https://openalex.org/keywords/superposition-principle","display_name":"Superposition principle","score":0.537708044052124},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5080289840698242},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5011196136474609},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.4807281792163849},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.45074373483657837},{"id":"https://openalex.org/keywords/syllabic-verse","display_name":"Syllabic verse","score":0.43031471967697144},{"id":"https://openalex.org/keywords/pitch-contour","display_name":"Pitch contour","score":0.42685043811798096},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3855689764022827},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.169343501329422},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.15513557195663452},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.08975064754486084}],"concepts":[{"id":"https://openalex.org/C542774811","wikidata":"https://www.wikidata.org/wiki/Q10880526","display_name":"Prosody","level":2,"score":0.8119261860847473},{"id":"https://openalex.org/C87619178","wikidata":"https://www.wikidata.org/wiki/Q126002","display_name":"Concatenation (mathematics)","level":2,"score":0.7008876204490662},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6906444430351257},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6864492893218994},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5747570395469666},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.571996808052063},{"id":"https://openalex.org/C21036866","wikidata":"https://www.wikidata.org/wiki/Q181767","display_name":"Stress (linguistics)","level":2,"score":0.550653874874115},{"id":"https://openalex.org/C27753989","wikidata":"https://www.wikidata.org/wiki/Q284885","display_name":"Superposition principle","level":2,"score":0.537708044052124},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5080289840698242},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5011196136474609},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.4807281792163849},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.45074373483657837},{"id":"https://openalex.org/C194051139","wikidata":"https://www.wikidata.org/wiki/Q2629608","display_name":"Syllabic verse","level":2,"score":0.43031471967697144},{"id":"https://openalex.org/C2777895490","wikidata":"https://www.wikidata.org/wiki/Q7198848","display_name":"Pitch contour","level":2,"score":0.42685043811798096},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3855689764022827},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.169343501329422},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.15513557195663452},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.08975064754486084},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/chinsl.2004.1409615","is_oa":false,"landing_page_url":"https://doi.org/10.1109/chinsl.2004.1409615","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SympoTIC '04. Joint 1st Workshop on Mobile Future &amp; Symposium on Trends In Communications (IEEE Cat. No.04EX877)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8100000023841858}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W141443464","https://openalex.org/W1505114477","https://openalex.org/W1523104099","https://openalex.org/W1594337151","https://openalex.org/W1999054645","https://openalex.org/W2034277951","https://openalex.org/W2093414802","https://openalex.org/W2104674061","https://openalex.org/W2113104907","https://openalex.org/W2126289105","https://openalex.org/W2162304437","https://openalex.org/W4285719527","https://openalex.org/W4390911627","https://openalex.org/W6635375606","https://openalex.org/W6675738750","https://openalex.org/W6860825834"],"related_works":["https://openalex.org/W234770729","https://openalex.org/W2588431733","https://openalex.org/W2391796527","https://openalex.org/W2387179309","https://openalex.org/W2388979876","https://openalex.org/W10581632","https://openalex.org/W4245668640","https://openalex.org/W1927421023","https://openalex.org/W2032960563","https://openalex.org/W2148228080"],"abstract_inverted_index":{"The":[0,76,108],"paper":[1],"presents":[2],"the":[3,6,15,26,80,83,86,103,127],"application":[4],"of":[5,28,51,53,82,85,105,110],"trainable":[7],"SFC":[8,16],"superpositional":[9],"prosodic":[10,18,38,48],"model":[11,99],"to":[12,60,117],"Chinese.":[13],"Within":[14],"model,":[17],"parameters":[19],"(F0,":[20],"syllabic":[21],"lengthening)":[22],"are":[23,34],"interpreted":[24],"as":[25,45],"superposition":[27],"overlapping":[29],"multiparametric":[30],"contours.":[31],"These":[32],"contours":[33],"associated":[35],"with":[36],"high-level":[37],"features":[39],"operating":[40],"at":[41],"different":[42],"scopes,":[43],"such":[44],"tones,":[46],"stress,":[47],"boundary,":[49],"part":[50],"speech":[52],"words,":[54],"etc.":[55],"Each":[56],"feature":[57],"label":[58],"corresponds":[59],"a":[61,73],"metalinguistic":[62],"function":[63],"(morphological,":[64],"lexical,":[65],"syntactic,":[66],"attitudinal,":[67],"etc.)":[68],"which":[69],"is":[70,79,93,113,121,130],"represented":[71],"by":[72],"neural":[74,88],"network.":[75],"observed":[77],"contour":[78],"sum":[81],"outputs":[84],"corresponding":[87],"networks.":[89],"An":[90],"analysis-by-synthesis":[91],"scheme":[92],"implemented":[94],"for":[95],"automatic":[96],"learning.":[97],"This":[98],"works":[100],"well":[101],"in":[102],"concatenation":[104],"neighbored":[106],"units.":[107],"RMSE":[109],"F0":[111],"prediction":[112],"2.34":[114],"st":[115],"(referenced":[116],"200":[118],"Hz),":[119],"correlation":[120],"0.86.":[122],"Perceptual":[123],"experiments":[124],"show":[125],"that":[126],"predicted":[128],"prosody":[129],"quite":[131],"appropriate":[132],"and":[133],"fluent.":[134]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
