{"id":"https://openalex.org/W1492653331","doi":"https://doi.org/10.21437/interspeech.2010-173","title":"Context adaptive training with factorized decision trees for HMM-based speech synthesis","display_name":"Context adaptive training with factorized decision trees for HMM-based speech synthesis","publication_year":2010,"publication_date":"2010-09-26","ids":{"openalex":"https://openalex.org/W1492653331","doi":"https://doi.org/10.21437/interspeech.2010-173","mag":"1492653331"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2010-173","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2010-173","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2010","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043098653","display_name":"Kai Yu","orcid":"https://orcid.org/0000-0002-7102-9826"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Kai Yu","raw_affiliation_strings":["University of Cambridge,"],"affiliations":[{"raw_affiliation_string":"University of Cambridge,","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003420204","display_name":"Heiga Zen","orcid":"https://orcid.org/0000-0002-8959-5471"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Heiga Zen","raw_affiliation_strings":["University of Cambridge,"],"affiliations":[{"raw_affiliation_string":"University of Cambridge,","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008513708","display_name":"Fran\u00e7ois Mairesse","orcid":"https://orcid.org/0000-0002-4969-4600"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Fran\u00e7ois Mairesse","raw_affiliation_strings":["University of Cambridge,"],"affiliations":[{"raw_affiliation_string":"University of Cambridge,","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":null,"display_name":"Steve Young","orcid":null},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Steve Young","raw_affiliation_strings":["University of Cambridge, Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, Cambridge, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5043098653"],"corresponding_institution_ids":["https://openalex.org/I241749"],"apc_list":null,"apc_paid":null,"fwci":0.9327,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.79265952,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"414","last_page":"417"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7862603664398193},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.7723957300186157},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.6914883852005005},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6874237060546875},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.5413435101509094},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5369460582733154},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.528761088848114},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5185475945472717},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5075579881668091},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4137776494026184},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.41075676679611206},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4095173478126526},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.05924138426780701}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7862603664398193},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.7723957300186157},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.6914883852005005},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6874237060546875},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.5413435101509094},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5369460582733154},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.528761088848114},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5185475945472717},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5075579881668091},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4137776494026184},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.41075676679611206},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4095173478126526},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.05924138426780701},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.21437/interspeech.2010-173","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2010-173","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2010","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.174.7782","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.174.7782","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://mi.eng.cam.ac.uk/%7Esjy/papers/yzmy10.pdf","raw_type":"text"},{"id":"pmh:oai:generic.eprints.org:343316","is_oa":false,"landing_page_url":"http://publications.eng.cam.ac.uk/343316/","pdf_url":null,"source":{"id":"https://openalex.org/S4406922847","display_name":"Cambridge University Engineering Department Publications Database","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference or Workshop Item"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7900000214576721,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W35069904","https://openalex.org/W102093577","https://openalex.org/W1507900585","https://openalex.org/W1599512239","https://openalex.org/W1600722501","https://openalex.org/W2000513720","https://openalex.org/W2002342963","https://openalex.org/W2048389584","https://openalex.org/W2049686551","https://openalex.org/W2069631319","https://openalex.org/W2093450784","https://openalex.org/W2103279870","https://openalex.org/W2143361917","https://openalex.org/W2146871184","https://openalex.org/W2154920538","https://openalex.org/W2158069733","https://openalex.org/W2740537351"],"related_works":["https://openalex.org/W2053269318","https://openalex.org/W2364370872","https://openalex.org/W2025614924","https://openalex.org/W2294335174","https://openalex.org/W2097963413","https://openalex.org/W3145575561","https://openalex.org/W2001275470","https://openalex.org/W2073996508","https://openalex.org/W1591475660","https://openalex.org/W2086773623"],"abstract_inverted_index":{"To":[0,57],"achieve":[1],"natural":[2],"high":[3],"quality":[4],"synthesised":[5],"speech":[6,9,174],"in":[7,47],"HMMbased":[8],"synthesis,":[10,175],"the":[11,35,64,114,123,157,163,168],"effective":[12],"modelling":[13],"of":[14,38,97,126],"complex":[15],"acoustic":[16],"and":[17,62,69,91,116,130,137],"linguistic":[18],"contexts":[19,61,71,90],"is":[20],"critical.":[21],"Traditional":[22],"approaches":[23,154],"use":[24],"context-dependent":[25],"HMMs":[26,87],"with":[27],"decision":[28,107,180],"tree":[29,181],"based":[30,139,165],"parameter":[31],"clustering":[32],"to":[33,52,102,110],"model":[34,59],"full":[36],"combination":[37],"contexts.":[39,99],"However,":[40,162],"weak":[41,60,68,98,115],"contexts,":[42],"such":[43],"as":[44],"word-level":[45,144],"emphasis":[46,145],"neutral":[48],"speech,":[49],"are":[50],"difficult":[51],"capture":[53],"using":[54],"this":[55,84],"approach.":[56,161],"effectively":[58],"reduce":[63],"data":[65],"sparsity":[66],"problem,":[67],"normal":[70,89,117],"should":[72],"be":[73,111],"treated":[74],"independently.":[75],"Context":[76],"adaptive":[77,104,128,152,177],"training":[78,129,153],"provides":[79],"a":[80,143],"structured":[81],"framework":[82,125],"for":[83,113],"whereby":[85],"standard":[86,158],"represent":[88,94],"linear":[92],"transforms":[93],"additional":[95],"effects":[96],"In":[100],"contrast":[101],"speaker":[103],"training,":[105,178],"separate":[106],"trees":[108],"have":[109],"built":[112],"context":[118,127,151,176],"factors.":[119],"This":[120],"paper":[121],"describes":[122],"general":[124],"investigates":[131],"three":[132],"concrete":[133],"forms:":[134],"MLLR,":[135],"CMLLR":[136],"CAT":[138],"systems.":[140],"Experiments":[141],"on":[142],"synthesis":[146],"task":[147],"show":[148],"that":[149],"all":[150],"can":[155],"outperform":[156],"full-context-dependent":[159],"HMM":[160],"MLLR":[164],"system":[166],"achieved":[167],"best":[169],"performance.":[170],"Index":[171],"Terms:":[172],"HMM-based":[173],"factorized":[179]},"counts_by_year":[{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
