{"id":"https://openalex.org/W2165143604","doi":"https://doi.org/10.1109/tasl.2010.2045237","title":"Thousands of Voices for HMM-Based Speech Synthesis\u2013Analysis and Application of TTS Systems Built on Various ASR Corpora","display_name":"Thousands of Voices for HMM-Based Speech Synthesis\u2013Analysis and Application of TTS Systems Built on Various ASR Corpora","publication_year":2010,"publication_date":"2010-03-16","ids":{"openalex":"https://openalex.org/W2165143604","doi":"https://doi.org/10.1109/tasl.2010.2045237","mag":"2165143604"},"language":"en","primary_location":{"id":"doi:10.1109/tasl.2010.2045237","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2010.2045237","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://era.ed.ac.uk/bitstream/1842/3727/1/YamagishiJ_Thousands%20of%20Voices.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007639385","display_name":"Junichi Yamagishi","orcid":"https://orcid.org/0000-0003-2752-3955"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Junichi Yamagishi","raw_affiliation_strings":["Centre of Speech Technology Research CSTR, University of Edinburgh, Edinburgh, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre of Speech Technology Research CSTR, University of Edinburgh, Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058936597","display_name":"Bela Usabaev","orcid":null},"institutions":[{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bela Usabaev","raw_affiliation_strings":["Universit\u00e4t Tubingen, Tubingen, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit\u00e4t Tubingen, Tubingen, Germany","institution_ids":["https://openalex.org/I8087733"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062516688","display_name":"Simon King","orcid":"https://orcid.org/0000-0002-2694-2843"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Simon King","raw_affiliation_strings":["Centre of Speech Technology Research CSTR, University of Edinburgh, Edinburgh, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre of Speech Technology Research CSTR, University of Edinburgh, Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110238677","display_name":"Oliver Watts","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Oliver Watts","raw_affiliation_strings":["Centre of Speech Technology Research CSTR, University of Edinburgh, Edinburgh, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre of Speech Technology Research CSTR, University of Edinburgh, Edinburgh, UK","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105301736","display_name":"John Dines","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"John Dines","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103093321","display_name":"Jilei Tian","orcid":"https://orcid.org/0000-0002-4588-9398"},"institutions":[{"id":"https://openalex.org/I4210099903","display_name":"Nokia (China)","ror":"https://ror.org/01607kg94","country_code":"CN","type":"company","lineage":["https://openalex.org/I2738502077","https://openalex.org/I4210099903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jilei Tian","raw_affiliation_strings":["Nokia Research Center, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nokia Research Center, Beijing, China","institution_ids":["https://openalex.org/I4210099903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100719922","display_name":"Yong Guan","orcid":"https://orcid.org/0000-0002-9044-2595"},"institutions":[{"id":"https://openalex.org/I4210099903","display_name":"Nokia (China)","ror":"https://ror.org/01607kg94","country_code":"CN","type":"company","lineage":["https://openalex.org/I2738502077","https://openalex.org/I4210099903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Guan","raw_affiliation_strings":["Nokia Research Center, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nokia Research Center, Beijing, China","institution_ids":["https://openalex.org/I4210099903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109250475","display_name":"Rile Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099903","display_name":"Nokia (China)","ror":"https://ror.org/01607kg94","country_code":"CN","type":"company","lineage":["https://openalex.org/I2738502077","https://openalex.org/I4210099903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rile Hu","raw_affiliation_strings":["Nokia Research Center, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nokia Research Center, Beijing, China","institution_ids":["https://openalex.org/I4210099903"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049909008","display_name":"Keiichiro Oura","orcid":null},"institutions":[{"id":"https://openalex.org/I197274945","display_name":"Nagoya Institute of Technology","ror":"https://ror.org/055yf1005","country_code":"JP","type":"education","lineage":["https://openalex.org/I197274945"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Keiichiro Oura","raw_affiliation_strings":["Department of Computer Science and Engineering, Nagoya Institute of Technology, Nagoya, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Nagoya Institute of Technology, Nagoya, Japan","institution_ids":["https://openalex.org/I197274945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039492028","display_name":"Yi-Jian Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I197274945","display_name":"Nagoya Institute of Technology","ror":"https://ror.org/055yf1005","country_code":"JP","type":"education","lineage":["https://openalex.org/I197274945"]},{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN","JP"],"is_corresponding":false,"raw_author_name":"Yi-Jian Wu","raw_affiliation_strings":["Nagoya Institute of Technology, Nagoya, Japan","TTS Group, Microsoft Business Corporation, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nagoya Institute of Technology, Nagoya, Japan","institution_ids":["https://openalex.org/I197274945"]},{"raw_affiliation_string":"TTS Group, Microsoft Business Corporation, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103023678","display_name":"Keiichi Tokuda","orcid":"https://orcid.org/0000-0001-6143-0133"},"institutions":[{"id":"https://openalex.org/I197274945","display_name":"Nagoya Institute of Technology","ror":"https://ror.org/055yf1005","country_code":"JP","type":"education","lineage":["https://openalex.org/I197274945"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Keiichi Tokuda","raw_affiliation_strings":["Department of Computer Science and Engineering, Nagoya Institute of Technology, Nagoya, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Nagoya Institute of Technology, Nagoya, Japan","institution_ids":["https://openalex.org/I197274945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023689975","display_name":"Reima Karhila","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reima Karhila","raw_affiliation_strings":["Adaptive Informatics Research Centre, Helsinki University of Technology, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adaptive Informatics Research Centre, Helsinki University of Technology, Finland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043424064","display_name":"Mikko Kurimo","orcid":"https://orcid.org/0000-0001-5278-7974"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mikko Kurimo","raw_affiliation_strings":["Adaptive Informatics Research Centre, Helsinki University of Technology, Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adaptive Informatics Research Centre, Helsinki University of Technology, Finland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":5,"institutions_distinct_count":13,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":14.9169,"has_fulltext":true,"cited_by_count":80,"citation_normalized_percentile":{"value":0.99000941,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"18","issue":"5","first_page":"984","last_page":"1004"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8100028038024902},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.7741106152534485},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.7530756592750549},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7337278723716736},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.45427262783050537},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.35475412011146545}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8100028038024902},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.7741106152534485},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.7530756592750549},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7337278723716736},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.45427262783050537},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35475412011146545},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":7,"locations":[{"id":"doi:10.1109/tasl.2010.2045237","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2010.2045237","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:era.ed.ac.uk:1842/3727","is_oa":true,"landing_page_url":"http://hdl.handle.net/1842/3727","pdf_url":"https://era.ed.ac.uk/bitstream/1842/3727/1/YamagishiJ_Thousands%20of%20Voices.pdf","source":{"id":"https://openalex.org/S7407055182","display_name":"ERA","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:era.ed.ac.uk:1842/3728","is_oa":false,"landing_page_url":"http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=5431023&tag=1","pdf_url":null,"source":{"id":"https://openalex.org/S7407055182","display_name":"ERA","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:era.ed.ac.uk:1842/4551","is_oa":false,"landing_page_url":"http://hdl.handle.net/1842/4551","pdf_url":null,"source":{"id":"https://openalex.org/S7407055182","display_name":"ERA","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:pure.ed.ac.uk:ec_fundedresources/b618da30-0205-4eff-9ab5-488abd0f44f0","is_oa":false,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=77953708096&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:pure.ed.ac.uk:openaire/b618da30-0205-4eff-9ab5-488abd0f44f0","is_oa":false,"landing_page_url":"https://hdl.handle.net/20.500.11820/b618da30-0205-4eff-9ab5-488abd0f44f0","pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Yamagishi, J, Usabaev, B, King, S, Watts, O, Dines, J, Tian, J, Guan, Y, Hu, R, Oura, K, Wu, Y-J, Tokuda, K, Karhila, R & Kurimo, M 2010, 'Thousands of Voices for HMM-Based Speech Synthesis-Analysis and Application of TTS Systems Built on Various ASR Corpora', IEEE Transactions on Audio, Speech and Language Processing, vol. 18, no. 5, pp. 984-1004. https://doi.org/10.1109/TASL.2010.2045237","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.ed.ac.uk:publications/b618da30-0205-4eff-9ab5-488abd0f44f0","is_oa":false,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/b618da30-0205-4eff-9ab5-488abd0f44f0","pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Yamagishi, J, Usabaev, B, King, S, Watts, O, Dines, J, Tian, J, Guan, Y, Hu, R, Oura, K, Wu, Y-J, Tokuda, K, Karhila, R & Kurimo, M 2010, 'Thousands of Voices for HMM-Based Speech Synthesis-Analysis and Application of TTS Systems Built on Various ASR Corpora', IEEE Transactions on Audio, Speech and Language Processing, vol. 18, no. 5, pp. 984-1004. https://doi.org/10.1109/TASL.2010.2045237","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:era.ed.ac.uk:1842/3727","is_oa":true,"landing_page_url":"http://hdl.handle.net/1842/3727","pdf_url":"https://era.ed.ac.uk/bitstream/1842/3727/1/YamagishiJ_Thousands%20of%20Voices.pdf","source":{"id":"https://openalex.org/S7407055182","display_name":"ERA","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320310086","display_name":"Helsingin Yliopisto","ror":"https://ror.org/040af2s02"},{"id":"https://openalex.org/F4320322138","display_name":"Universidad Polit\u00e9cnica de Madrid","ror":"https://ror.org/03n6nwv02"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2165143604.pdf","grobid_xml":"https://content.openalex.org/works/W2165143604.grobid-xml"},"referenced_works_count":81,"referenced_works":["https://openalex.org/W8362967","https://openalex.org/W51508392","https://openalex.org/W66627554","https://openalex.org/W113498433","https://openalex.org/W163148820","https://openalex.org/W204204962","https://openalex.org/W1493817255","https://openalex.org/W1513877108","https://openalex.org/W1521340514","https://openalex.org/W1529897604","https://openalex.org/W1556556182","https://openalex.org/W1564152904","https://openalex.org/W1575512834","https://openalex.org/W1580849279","https://openalex.org/W1592103878","https://openalex.org/W1599512239","https://openalex.org/W1600722501","https://openalex.org/W1963627370","https://openalex.org/W1969876212","https://openalex.org/W1975800736","https://openalex.org/W1984905644","https://openalex.org/W1989337816","https://openalex.org/W2000513720","https://openalex.org/W2000728161","https://openalex.org/W2002342963","https://openalex.org/W2024490156","https://openalex.org/W2042691334","https://openalex.org/W2044871134","https://openalex.org/W2049633694","https://openalex.org/W2049686551","https://openalex.org/W2063415950","https://openalex.org/W2093450784","https://openalex.org/W2100340603","https://openalex.org/W2104653033","https://openalex.org/W2106792148","https://openalex.org/W2111482576","https://openalex.org/W2116046013","https://openalex.org/W2117418893","https://openalex.org/W2119929864","https://openalex.org/W2121566228","https://openalex.org/W2129142580","https://openalex.org/W2130722890","https://openalex.org/W2136545725","https://openalex.org/W2139751012","https://openalex.org/W2142416747","https://openalex.org/W2144139079","https://openalex.org/W2150850689","https://openalex.org/W2153914468","https://openalex.org/W2155977751","https://openalex.org/W2158069733","https://openalex.org/W2165143604","https://openalex.org/W2168884969","https://openalex.org/W2170980774","https://openalex.org/W2186896963","https://openalex.org/W2204452154","https://openalex.org/W2276283915","https://openalex.org/W2296704011","https://openalex.org/W2394921947","https://openalex.org/W2400063444","https://openalex.org/W2402261002","https://openalex.org/W2428180336","https://openalex.org/W2915628810","https://openalex.org/W2917438849","https://openalex.org/W3011402798","https://openalex.org/W4205130185","https://openalex.org/W4229835067","https://openalex.org/W4252316495","https://openalex.org/W4395681711","https://openalex.org/W6602682705","https://openalex.org/W6606716589","https://openalex.org/W6608211636","https://openalex.org/W6630780049","https://openalex.org/W6631254342","https://openalex.org/W6633234927","https://openalex.org/W6676782290","https://openalex.org/W6677333272","https://openalex.org/W6677973343","https://openalex.org/W6712208827","https://openalex.org/W6712610176","https://openalex.org/W6759752890","https://openalex.org/W7075637324"],"related_works":["https://openalex.org/W2136763963","https://openalex.org/W2109705048","https://openalex.org/W2940588515","https://openalex.org/W1909151225","https://openalex.org/W3184123547","https://openalex.org/W2160030256","https://openalex.org/W1521297879","https://openalex.org/W4253235840","https://openalex.org/W3151937861","https://openalex.org/W2488941600"],"abstract_inverted_index":{"In":[0,143],"conventional":[1],"speech":[2,9,60,68,83,154],"synthesis,":[3,36],"large":[4,126],"amounts":[5],"of":[6,39,128,135,140,150,186],"phonetically":[7],"balanced":[8],"data":[10,28,84],"recorded":[11,87],"in":[12],"highly":[13],"controlled":[14],"recording":[15,47],"studio":[16],"environments":[17],"are":[18,49,86,96],"typically":[19],"required":[20],"to":[21,81,108,132],"build":[22],"a":[23,30,125],"voice.":[24],"Although":[25],"using":[26],"such":[27,116,165],"is":[29,79],"straightforward":[31],"solution":[32],"for":[33,152],"high":[34],"quality":[35],"the":[37,52,133,148,167,184],"number":[38,127,139],"voices":[40,112,141,151],"available":[41],"will":[42],"always":[43],"be":[44],"limited,":[45],"because":[46],"costs":[48],"high.":[50],"On":[51],"other":[53],"hand,":[54],"our":[55],"recent":[56],"experiments":[57],"with":[58,92],"HMM-based":[59,67,153],"synthesis":[61,69,155],"systems":[62],"have":[63,158],"demonstrated":[64],"that":[65,85,95,101,156],"speaker-adaptive":[66],"(which":[70],"uses":[71],"an":[72,137],"\u201caverage":[73],"voice":[74],"model\u201d":[75],"plus":[76],"model":[77],"adaptation)":[78],"robust":[80],"non-ideal":[82],"under":[88],"various":[89],"conditions":[90],"and":[91,173,178,193],"varying":[93],"microphones,":[94],"not":[97],"perfectly":[98],"clean,":[99],"and/or":[100],"lack":[102],"phonetic":[103],"balance.":[104],"This":[105],"enables":[106],"us":[107],"consider":[109],"building":[110],"high-quality":[111],"on":[113,190],"\u201cnon-TTS\u201d":[114],"corpora":[115,122,164],"as":[117,166],"ASR":[118,121,163],"corpora.":[119],"Since":[120],"generally":[123],"include":[124],"speakers,":[129],"this":[130,144],"leads":[131],"possibility":[134],"producing":[136],"enormous":[138],"automatically.":[142],"paper,":[145],"we":[146,157],"demonstrate":[147],"thousands":[149],"made":[159],"from":[160],"several":[161],"popular":[162],"Wall":[168],"Street":[169],"Journal":[170],"(WSJ0,":[171],"WSJ1,":[172],"WSJCAM0),":[174],"Resource":[175],"Management,":[176],"Globalphone,":[177],"SPEECON":[179],"databases.":[180],"We":[181],"also":[182],"present":[183],"results":[185],"associated":[187],"analysis":[188],"based":[189],"perceptual":[191],"evaluation,":[192],"discuss":[194],"remaining":[195],"issues.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":9},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":15}],"updated_date":"2026-06-13T07:54:00.901334","created_date":"2025-10-10T00:00:00"}
