{"id":"https://openalex.org/W2395677905","doi":"https://doi.org/10.4018/ijmdem.2016040104","title":"Unit-Selection Speech Synthesis Method Using Words as Search Units","display_name":"Unit-Selection Speech Synthesis Method Using Words as Search Units","publication_year":2016,"publication_date":"2016-04-01","ids":{"openalex":"https://openalex.org/W2395677905","doi":"https://doi.org/10.4018/ijmdem.2016040104","mag":"2395677905"},"language":"en","primary_location":{"id":"doi:10.4018/ijmdem.2016040104","is_oa":true,"landing_page_url":"https://doi.org/10.4018/ijmdem.2016040104","pdf_url":null,"source":{"id":"https://openalex.org/S87630009","display_name":"International Journal of Multimedia Data Engineering and Management","issn_l":"1947-8534","issn":["1947-8534","1947-8542"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320424","host_organization_name":"IGI Global","host_organization_lineage":["https://openalex.org/P4310320424"],"host_organization_lineage_names":["IGI Global"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Multimedia Data Engineering and Management","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.4018/ijmdem.2016040104","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032078198","display_name":"Hiroyuki Segi","orcid":null},"institutions":[{"id":"https://openalex.org/I6030618","display_name":"Seikei University","ror":"https://ror.org/03ptaj492","country_code":"JP","type":"education","lineage":["https://openalex.org/I6030618"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Hiroyuki Segi","raw_affiliation_strings":["Department of Computer and Information Science, Seikei University, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer and Information Science, Seikei University, Tokyo, Japan","institution_ids":["https://openalex.org/I6030618"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5032078198"],"corresponding_institution_ids":["https://openalex.org/I6030618"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02460169,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"7","issue":"2","first_page":"1","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9423999786376953,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9401999711990356,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.7947566509246826},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.779596745967865},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7314481735229492},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.705363392829895},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.6904852986335754},{"id":"https://openalex.org/keywords/waveform","display_name":"Waveform","score":0.48470616340637207},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.47769930958747864},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.45019271969795227},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4346063733100891},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.41141754388809204},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3290495276451111},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3290316164493561},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10490170121192932},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.057413339614868164}],"concepts":[{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.7947566509246826},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.779596745967865},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7314481735229492},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.705363392829895},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.6904852986335754},{"id":"https://openalex.org/C197424946","wikidata":"https://www.wikidata.org/wiki/Q1165717","display_name":"Waveform","level":3,"score":0.48470616340637207},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.47769930958747864},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.45019271969795227},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4346063733100891},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.41141754388809204},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3290495276451111},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3290316164493561},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10490170121192932},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.057413339614868164},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.4018/ijmdem.2016040104","is_oa":true,"landing_page_url":"https://doi.org/10.4018/ijmdem.2016040104","pdf_url":null,"source":{"id":"https://openalex.org/S87630009","display_name":"International Journal of Multimedia Data Engineering and Management","issn_l":"1947-8534","issn":["1947-8534","1947-8542"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320424","host_organization_name":"IGI Global","host_organization_lineage":["https://openalex.org/P4310320424"],"host_organization_lineage_names":["IGI Global"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Multimedia Data Engineering and Management","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:igg:jmdem0:v:7:y:2016:i:2:p:1-15","is_oa":false,"landing_page_url":"http://services.igi-global.com/resolvedoi/resolve.aspx?doi=10.4018/IJMDEM.2016040104","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.4018/ijmdem.2016040104","is_oa":true,"landing_page_url":"https://doi.org/10.4018/ijmdem.2016040104","pdf_url":null,"source":{"id":"https://openalex.org/S87630009","display_name":"International Journal of Multimedia Data Engineering and Management","issn_l":"1947-8534","issn":["1947-8534","1947-8542"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320424","host_organization_name":"IGI Global","host_organization_lineage":["https://openalex.org/P4310320424"],"host_organization_lineage_names":["IGI Global"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Multimedia Data Engineering and Management","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.44999998807907104}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W3979272","https://openalex.org/W88081813","https://openalex.org/W292238991","https://openalex.org/W1516942267","https://openalex.org/W1975376789","https://openalex.org/W1991133427","https://openalex.org/W1992287499","https://openalex.org/W2000513720","https://openalex.org/W2039133177","https://openalex.org/W2042360461","https://openalex.org/W2044320604","https://openalex.org/W2049686551","https://openalex.org/W2049717526","https://openalex.org/W2054748351","https://openalex.org/W2061613332","https://openalex.org/W2073541007","https://openalex.org/W2099727438","https://openalex.org/W2110413797","https://openalex.org/W2120657668","https://openalex.org/W2129142580","https://openalex.org/W2145575463","https://openalex.org/W2150658333","https://openalex.org/W2158069733","https://openalex.org/W2394921947","https://openalex.org/W2402788381","https://openalex.org/W2428180336","https://openalex.org/W2581437851"],"related_works":["https://openalex.org/W2039489009","https://openalex.org/W642007152","https://openalex.org/W4253660971","https://openalex.org/W2401827384","https://openalex.org/W2355290951","https://openalex.org/W2069501481","https://openalex.org/W1909292483","https://openalex.org/W2164147372","https://openalex.org/W2550171623","https://openalex.org/W596245619"],"abstract_inverted_index":{"Unit-selection":[0],"speech-synthesis":[1,11],"systems":[2],"have":[3],"been":[4],"proposed.":[5],"In":[6],"most":[7],"of":[8,56,66,77,100,122],"the":[9,54,57,61,64,78,82,101,120],"unit-selection":[10,123],"systems,":[12],"search":[13,70,129],"units":[14,32],"are":[15],"rather":[16],"short":[17],"such":[18],"as":[19,69,112,114,128],"syllables,":[20],"phonemes":[21],"and":[22,37,106],"diphones.":[23],"However,":[24],"when":[25],"applied":[26],"to":[27,110],"large":[28],"speech":[29,40,79,103,124],"databases,":[30],"shorter":[31],"produce":[33],"more":[34,86],"voice-waveform":[35],"candidates":[36],"a":[38,92],"larger":[39],"database":[41],"cannot":[42],"be":[43],"used":[44],"without":[45],"narrow":[46],"pruning":[47,52],"for":[48],"practical":[49],"use.":[50],"Narrow":[51],"impairs":[53],"quality":[55],"synthesized":[58,80,90,102],"speech.":[59,116],"Here":[60],"author":[62],"examined":[63],"possibility":[65],"using":[67,126],"words":[68,127],"units.":[71,130],"Subjective":[72],"evaluations":[73],"indicated":[74],"that":[75,89],"70%":[76],"by":[81,91],"proposed":[83],"method":[84],"sounded":[85],"natural":[87,113],"than":[88],"conventional":[93],"method.":[94],"The":[95],"five-point":[96],"mean":[97],"opinion":[98],"score":[99],"was":[104,108],"3.5,":[105],"21%":[107],"judged":[109],"sound":[111],"human":[115],"These":[117],"results":[118],"demonstrate":[119],"effectiveness":[121],"synthesis":[125]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
