{"id":"https://openalex.org/W2162295204","doi":"https://doi.org/10.1109/tasl.2009.2034771","title":"Hierarchical Prosody Conversion Using Regression-Based Clustering for Emotional Speech Synthesis","display_name":"Hierarchical Prosody Conversion Using Regression-Based Clustering for Emotional Speech Synthesis","publication_year":2009,"publication_date":"2009-10-22","ids":{"openalex":"https://openalex.org/W2162295204","doi":"https://doi.org/10.1109/tasl.2009.2034771","mag":"2162295204"},"language":"en","primary_location":{"id":"doi:10.1109/tasl.2009.2034771","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2009.2034771","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103251327","display_name":"Chung\u2010Hsien Wu","orcid":"https://orcid.org/0000-0002-3947-2123"},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Hsien Wu","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112618770","display_name":"Chi-Chun Hsia","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chi-Chun Hsia","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106764737","display_name":"Chung-Han Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Han Lee","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036911930","display_name":"Mai-Chun Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148468","display_name":"Industrial Technology Research Institute","ror":"https://ror.org/05szzwt63","country_code":"TW","type":"nonprofit","lineage":["https://openalex.org/I4210148468"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Mai-Chun Lin","raw_affiliation_strings":["Industrial Technology Research Institute-South, ICT-Enabled Healthcare Project, Hsinchu, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Industrial Technology Research Institute-South, ICT-Enabled Healthcare Project, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I4210148468"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.6238,"has_fulltext":false,"cited_by_count":58,"citation_normalized_percentile":{"value":0.93442687,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"18","issue":"6","first_page":"1394","last_page":"1405"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prosody","display_name":"Prosody","score":0.8975764513015747},{"id":"https://openalex.org/keywords/pitch-contour","display_name":"Pitch contour","score":0.6162829399108887},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6154675483703613},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5955674648284912},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.588247537612915},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5082178115844727},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5022001266479492},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5009510517120361},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.47309306263923645},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.4643426835536957},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.4458160400390625},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4421869218349457},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3315380811691284},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29541927576065063},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09831702709197998}],"concepts":[{"id":"https://openalex.org/C542774811","wikidata":"https://www.wikidata.org/wiki/Q10880526","display_name":"Prosody","level":2,"score":0.8975764513015747},{"id":"https://openalex.org/C2777895490","wikidata":"https://www.wikidata.org/wiki/Q7198848","display_name":"Pitch contour","level":2,"score":0.6162829399108887},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6154675483703613},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5955674648284912},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.588247537612915},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5082178115844727},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5022001266479492},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5009510517120361},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.47309306263923645},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.4643426835536957},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.4458160400390625},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4421869218349457},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3315380811691284},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29541927576065063},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09831702709197998},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tasl.2009.2034771","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2009.2034771","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W83932636","https://openalex.org/W126257978","https://openalex.org/W191556021","https://openalex.org/W250076511","https://openalex.org/W1518567289","https://openalex.org/W1518648436","https://openalex.org/W1528372724","https://openalex.org/W1588037970","https://openalex.org/W1849169576","https://openalex.org/W1926768285","https://openalex.org/W1965392255","https://openalex.org/W2013319990","https://openalex.org/W2034277951","https://openalex.org/W2049633694","https://openalex.org/W2049686551","https://openalex.org/W2096195361","https://openalex.org/W2098831047","https://openalex.org/W2099625897","https://openalex.org/W2100441082","https://openalex.org/W2107713197","https://openalex.org/W2108601574","https://openalex.org/W2110332474","https://openalex.org/W2114659828","https://openalex.org/W2118850452","https://openalex.org/W2120605154","https://openalex.org/W2126289105","https://openalex.org/W2146921187","https://openalex.org/W2149425161","https://openalex.org/W2150791533","https://openalex.org/W2156142001","https://openalex.org/W2161135987","https://openalex.org/W2161736993","https://openalex.org/W2539454895","https://openalex.org/W3113207934","https://openalex.org/W4285719527","https://openalex.org/W4390911438","https://openalex.org/W4402490932","https://openalex.org/W6607864401","https://openalex.org/W6631584049","https://openalex.org/W6674786178","https://openalex.org/W6674890362","https://openalex.org/W6676110152","https://openalex.org/W6728916261"],"related_works":["https://openalex.org/W2385578626","https://openalex.org/W2162295204","https://openalex.org/W2785978752","https://openalex.org/W1533931297","https://openalex.org/W4389356655","https://openalex.org/W2052542215","https://openalex.org/W57220205","https://openalex.org/W1965454423","https://openalex.org/W1965141925","https://openalex.org/W2112390707"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"an":[3,183],"approach":[4],"to":[5,110,129,175],"hierarchical":[6,24,188],"prosody":[7,81,113,121,142,180],"conversion":[8,114,181],"for":[9,73,89,116,141,161,179],"emotional":[10,146],"speech":[11,19,126,148],"synthesis.":[12],"The":[13,35,50],"pitch":[14,36,57,61,74,99],"contour":[15,37,58,62],"of":[16,28,123],"the":[17,39,45,52,55,60,65,77,98,112,124,131,136,172,176,187,192],"source":[18,56,125],"is":[20,42,70],"decomposed":[21],"into":[22],"a":[23,105],"prosodic":[25,30,92,189],"structure":[26,190],"consisting":[27],"sentence,":[29],"word,":[31],"and":[32,59,91,119,138,153,159,163,166,171,191],"subsyllable":[33,96],"levels.":[34],"in":[38],"higher":[40],"level":[41],"encoded":[43],"by":[44],"discrete":[46,66],"Legendre":[47,67],"polynomial":[48,68],"coefficients.":[49],"residual,":[51],"difference":[53],"between":[54],"decoded":[63],"from":[64],"coefficients,":[69],"then":[71],"used":[72,88],"modeling":[75],"at":[76],"lower":[78],"level.":[79],"For":[80],"conversion,":[82],"Gaussian":[83],"mixture":[84],"models":[85],"(GMMs)":[86],"are":[87,102,127],"sentence-":[90],"word-level":[93],"conversion.":[94,143],"At":[95],"level,":[97],"feature":[100],"vectors":[101],"clustered":[103],"via":[104],"proposed":[106,193],"regression-based":[107,194],"clustering":[108,195],"method":[109,178],"generate":[111],"functions":[115],"selection.":[117],"Linguistic":[118],"symbolic":[120],"features":[122],"adopted":[128],"select":[130],"most":[132],"suitable":[133],"function":[134],"using":[135,186],"classification":[137],"regression":[139],"tree":[140],"Three":[144],"small-sized":[145],"parallel":[147],"databases":[149],"with":[150],"happy,":[151],"angry,":[152],"sad":[154],"emotions,":[155],"respectively,":[156],"were":[157,169],"designed":[158],"collected":[160],"training":[162],"evaluation.":[164],"Objective":[165],"subjective":[167],"evaluations":[168],"conducted":[170],"comparison":[173],"results":[174],"GMM-based":[177],"achieved":[182],"improved":[184],"performance":[185],"method.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":8},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":6}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
