{"id":"https://openalex.org/W2785466268","doi":"https://doi.org/10.1109/apsipa.2017.8282022","title":"Representing raw linguistic information in chinese text-to-speech system","display_name":"Representing raw linguistic information in chinese text-to-speech system","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2785466268","doi":"https://doi.org/10.1109/apsipa.2017.8282022","mag":"2785466268"},"language":"en","primary_location":{"id":"doi:10.1109/apsipa.2017.8282022","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2017.8282022","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021872761","display_name":"Minghui Dong","orcid":"https://orcid.org/0000-0001-6543-2929"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Minghui Dong","raw_affiliation_strings":["Human Language Technology Department, Institute for Infocomm Research (I2R), Singapore"],"affiliations":[{"raw_affiliation_string":"Human Language Technology Department, Institute for Infocomm Research (I2R), Singapore","institution_ids":["https://openalex.org/I3005327000"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057050780","display_name":"Zhengchen Zhang","orcid":"https://orcid.org/0009-0005-4225-3537"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhengchen Zhang","raw_affiliation_strings":["Human Language Technology Department, Institute for Infocomm Research (I2R), Singapore"],"affiliations":[{"raw_affiliation_string":"Human Language Technology Department, Institute for Infocomm Research (I2R), Singapore","institution_ids":["https://openalex.org/I3005327000"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110320609","display_name":"Huaiping Ming","orcid":null},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Huaiping Ming","raw_affiliation_strings":["Human Language Technology Department, Institute for Infocomm Research (I2R), Singapore"],"affiliations":[{"raw_affiliation_string":"Human Language Technology Department, Institute for Infocomm Research (I2R), Singapore","institution_ids":["https://openalex.org/I3005327000"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5021872761"],"corresponding_institution_ids":["https://openalex.org/I3005327000"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1996204,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"99","issue":null,"first_page":"167","last_page":"170"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.799262285232544},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6489297151565552},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5845451951026917},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5531939268112183},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.47062447667121887},{"id":"https://openalex.org/keywords/pinyin","display_name":"Pinyin","score":0.465424507856369},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4569428861141205},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.44144514203071594},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.43806248903274536},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.43716636300086975},{"id":"https://openalex.org/keywords/text-segmentation","display_name":"Text segmentation","score":0.42508846521377563},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.320911705493927},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2838044762611389},{"id":"https://openalex.org/keywords/chinese-characters","display_name":"Chinese characters","score":0.28093862533569336}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.799262285232544},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6489297151565552},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5845451951026917},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5531939268112183},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.47062447667121887},{"id":"https://openalex.org/C2781095461","wikidata":"https://www.wikidata.org/wiki/Q42222","display_name":"Pinyin","level":3,"score":0.465424507856369},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4569428861141205},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.44144514203071594},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.43806248903274536},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.43716636300086975},{"id":"https://openalex.org/C98501671","wikidata":"https://www.wikidata.org/wiki/Q1948408","display_name":"Text segmentation","level":3,"score":0.42508846521377563},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.320911705493927},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2838044762611389},{"id":"https://openalex.org/C2781051154","wikidata":"https://www.wikidata.org/wiki/Q8201","display_name":"Chinese characters","level":2,"score":0.28093862533569336},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipa.2017.8282022","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2017.8282022","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7599999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1571950845","https://openalex.org/W1578102511","https://openalex.org/W2102003408","https://openalex.org/W2181607856","https://openalex.org/W2335876948","https://openalex.org/W2400229727","https://openalex.org/W2471520273","https://openalex.org/W2525520955","https://openalex.org/W2526838772","https://openalex.org/W2901997113","https://openalex.org/W2996160789","https://openalex.org/W4235132546","https://openalex.org/W6634201745","https://openalex.org/W6634556219","https://openalex.org/W6686045668","https://openalex.org/W6756197946","https://openalex.org/W6772289264"],"related_works":["https://openalex.org/W2254356171","https://openalex.org/W2393940967","https://openalex.org/W2386957102","https://openalex.org/W644266459","https://openalex.org/W2159591557","https://openalex.org/W2385598138","https://openalex.org/W2346578824","https://openalex.org/W2366925922","https://openalex.org/W2115592387","https://openalex.org/W2905950556"],"abstract_inverted_index":{"In":[0,91],"this":[1,92],"paper,":[2,93],"we":[3,94,161,216],"propose":[4],"a":[5,133,136,152,156,169,208],"method":[6],"of":[7,66,76,147,158,164,181,191],"representing":[8],"linguistic":[9,17,104,193,205,226,239],"features":[10,18,105,194,206],"for":[11,19,42,87],"Chinese":[12,20,99,113,116,159],"text-to-speech":[13],"(TTS)":[14],"systems.":[15],"Traditional":[16],"TTS":[21,78,213],"include":[22],"information":[23],"about":[24],"the":[25,67,74,77,81,112,148,179,182,192,219,222,237,243,247],"related":[26],"phones,":[27],"syllables,":[28],"words,":[29,31],"prosodic":[30,32,47,50],"phrases,":[33],"etc.":[34,53],"Normally,":[35],"models":[36,68],"would":[37],"need":[38],"to":[39,102,130,144,167,177],"be":[40,142],"built":[41,176],"word":[43,48],"segmentation,":[44],"part-of-speech":[45],"tagging,":[46],"prediction,":[49,52],"phrase":[51],"To":[54,110,150],"train":[55],"these":[56],"models,":[57],"large":[58],"annotated":[59,82,108],"corpora":[60,83],"are":[61,84],"normally":[62],"needed.":[63],"The":[64,184],"quality":[65,75],"will":[69],"have":[70,201,217],"an":[71,131,173],"effect":[72],"on":[73],"system.":[79],"However,":[80],"often":[85],"unavailable":[86],"many":[88],"low-resource":[89],"languages.":[90],"encode":[95],"phone":[96,197],"sequences":[97,101],"and":[98,135,215,231],"character":[100,117,166],"form":[103,168],"without":[106],"using":[107,224],"corpora.":[109],"represent":[111,145,151],"sequences,":[114],"each":[115,146,165],"is":[118,127,175,187],"converted":[119],"into":[120],"its":[121],"pronunciation":[122],"(represented":[123],"by":[124],"Pinyin),":[125],"which":[126],"further":[128],"mapped":[129],"initial,":[132],"final":[134],"tone.":[137],"One-":[138],"hot":[139],"vectors":[140,163],"can":[141],"used":[143,188],"elements.":[149],"context":[153],"window":[154],"covering":[155],"sequence":[157,198],"characters,":[160],"concatenate":[162],"long":[170],"vector.":[171,183],"Then":[172],"autoencoder":[174],"reduce":[178],"dimension":[180],"compressed":[185],"vector":[186],"as":[189,246],"part":[190],"together":[195],"with":[196,221],"features.":[199,227,249],"We":[200],"applied":[202],"our":[203],"proposed":[204,238],"in":[207],"deep":[209],"neural":[210],"network":[211],"(DNN)-based":[212],"system,":[214],"compared":[218],"system":[220],"one":[223],"traditional":[225,248],"Both":[228],"objective":[229],"evaluation":[230],"subjective":[232],"listening":[233],"test":[234],"show":[235],"that":[236],"representation":[240],"achieves":[241],"almost":[242],"same":[244],"performance":[245]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
