{"id":"https://openalex.org/W2920970185","doi":"https://doi.org/10.23919/apsipa.2018.8659652","title":"TDNN-Based Multilingual Mix-Synthesis with Language Discriminative Training","display_name":"TDNN-Based Multilingual Mix-Synthesis with Language Discriminative Training","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2920970185","doi":"https://doi.org/10.23919/apsipa.2018.8659652","mag":"2920970185"},"language":"en","primary_location":{"id":"doi:10.23919/apsipa.2018.8659652","is_oa":false,"landing_page_url":"https://doi.org/10.23919/apsipa.2018.8659652","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044229820","display_name":"Gulijiamali Maimaitiaili","orcid":"https://orcid.org/0009-0005-2212-9344"},"institutions":[{"id":"https://openalex.org/I1334729051","display_name":"Xinjiang Normal University","ror":"https://ror.org/00ndrvk93","country_code":"CN","type":"education","lineage":["https://openalex.org/I1334729051"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gulijiamali Maimaitiaili","raw_affiliation_strings":["School of Mathematical Science, Xinjiang Normal University, Urumqi, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematical Science, Xinjiang Normal University, Urumqi, China","institution_ids":["https://openalex.org/I1334729051"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100352621","display_name":"Zhiyong Zhang","orcid":"https://orcid.org/0000-0003-3061-7768"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Zhang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012159935","display_name":"Aisikaer Rouzi","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aisikaer Rouzi","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5044229820"],"corresponding_institution_ids":["https://openalex.org/I1334729051"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18940832,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"605","last_page":"610"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8788819313049316},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8369676470756531},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5880993008613586},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5655707716941833},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.537445604801178},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5346839427947998},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4945501983165741},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49425840377807617},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4930996596813202},{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.44823381304740906},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.44210225343704224},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.43229156732559204},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2152320146560669}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8788819313049316},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8369676470756531},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5880993008613586},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5655707716941833},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.537445604801178},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5346839427947998},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4945501983165741},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49425840377807617},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4930996596813202},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.44823381304740906},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.44210225343704224},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.43229156732559204},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2152320146560669},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/apsipa.2018.8659652","is_oa":false,"landing_page_url":"https://doi.org/10.23919/apsipa.2018.8659652","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7599999904632568,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1499332833","https://openalex.org/W1524333225","https://openalex.org/W1570874634","https://openalex.org/W1576227399","https://openalex.org/W1613141907","https://openalex.org/W1989549063","https://openalex.org/W1990505856","https://openalex.org/W1997449813","https://openalex.org/W2020024436","https://openalex.org/W2045158511","https://openalex.org/W2079623482","https://openalex.org/W2102003408","https://openalex.org/W2117671523","https://openalex.org/W2129142580","https://openalex.org/W2134973740","https://openalex.org/W2294797155","https://openalex.org/W2398462115","https://openalex.org/W2400517318","https://openalex.org/W2402146185","https://openalex.org/W2471520273","https://openalex.org/W2598638573","https://openalex.org/W2605320104","https://openalex.org/W2636064478","https://openalex.org/W2759925408","https://openalex.org/W2786149683","https://openalex.org/W6631362777","https://openalex.org/W6675380101","https://openalex.org/W6696843773","https://openalex.org/W6712869911","https://openalex.org/W6736204136"],"related_works":["https://openalex.org/W2990005675","https://openalex.org/W2374317326","https://openalex.org/W1603321096","https://openalex.org/W2394766824","https://openalex.org/W2078713291","https://openalex.org/W2361574037","https://openalex.org/W2386292991","https://openalex.org/W2364440891","https://openalex.org/W2113687551","https://openalex.org/W2112752961"],"abstract_inverted_index":{"We":[0],"propose":[1],"to":[2,49,64,120,123,135],"build":[3],"a":[4,75],"time":[5],"delay":[6],"neural":[7,78],"network":[8,41,52,79],"based,":[9],"Mandarin":[10],"and":[11,36,70,104,110,132],"Uyghur,":[12],"bilingual":[13],"TTS":[14],"system.":[15],"To":[16],"facilitate":[17],"the":[18,22,72,81,89,97,125,137],"phone":[19],"sharing":[20,38],"across":[21],"two":[23],"languages,":[24,114],"we":[25],"design":[26],"multilingual":[27,90,105],"question":[28],"set,":[29],"which":[30],"includes":[31],"language":[32,34,43,99,115],"specific,":[33],"independent":[35],"IPA":[37],"questions.":[39],"Neural":[40],"based":[42],"discriminative":[44,57,100,116],"approach":[45],"is":[46,59],"also":[47,118],"used":[48],"get":[50],"better":[51],"output":[53,73,82,138],"during":[54],"mix-training.":[55],"Language":[56],"information":[58],"augmented":[60],"as":[61],"auxiliary":[62],"feature":[63],"linguistic":[65,127],"features":[66,128],"at":[67,80],"input":[68],"level":[69],"control":[71,136],"of":[74],"feed-forward":[76],"deep":[77],"layer.":[83],"Preliminary":[84],"experimental":[85],"results":[86],"show":[87,119],"that":[88],"mix-synthesis":[91],"models":[92],"can":[93,133],"be":[94,121],"constructed":[95],"using":[96],"proposed":[98],"training":[101],"architecture.":[102],"Monolingual":[103],"system":[106],"performance":[107],"are":[108],"evaluated":[109],"compared":[111],"for":[112],"both":[113],"codes":[117],"efficient":[122],"distinguish":[124],"contextual":[126],"from":[129],"different":[130],"languages":[131],"help":[134],"features.":[139]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
