{"id":"https://openalex.org/W2990384275","doi":"https://doi.org/10.1109/access.2019.2954342","title":"Deep Learning for Mandarin-Tibetan Cross-Lingual Speech Synthesis","display_name":"Deep Learning for Mandarin-Tibetan Cross-Lingual Speech Synthesis","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2990384275","doi":"https://doi.org/10.1109/access.2019.2954342","mag":"2990384275"},"language":"en","primary_location":{"id":"doi:10.1109/access.2019.2954342","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2019.2954342","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08906089.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08906089.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060794156","display_name":"Weizhao Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I68986083","display_name":"Northwest Normal University","ror":"https://ror.org/00gx3j908","country_code":"CN","type":"education","lineage":["https://openalex.org/I68986083"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weizhao Zhang","raw_affiliation_strings":["College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China","National and Provincial Joint Engineering Laboratory of Learning Analysis Technology in Online Education, Lanzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China","institution_ids":["https://openalex.org/I68986083"]},{"raw_affiliation_string":"National and Provincial Joint Engineering Laboratory of Learning Analysis Technology in Online Education, Lanzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032919424","display_name":"Hongwu Yang","orcid":"https://orcid.org/0000-0002-8939-3386"},"institutions":[{"id":"https://openalex.org/I68986083","display_name":"Northwest Normal University","ror":"https://ror.org/00gx3j908","country_code":"CN","type":"education","lineage":["https://openalex.org/I68986083"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongwu Yang","raw_affiliation_strings":["College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China","National and Provincial Joint Engineering Laboratory of Learning Analysis Technology in Online Education, Lanzhou, China","School of Educational Technology, Northwest Normal University, Lanzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China","institution_ids":["https://openalex.org/I68986083"]},{"raw_affiliation_string":"National and Provincial Joint Engineering Laboratory of Learning Analysis Technology in Online Education, Lanzhou, China","institution_ids":[]},{"raw_affiliation_string":"School of Educational Technology, Northwest Normal University, Lanzhou, China","institution_ids":["https://openalex.org/I68986083"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017728921","display_name":"Xiaolong Bu","orcid":"https://orcid.org/0000-0003-1983-4251"},"institutions":[{"id":"https://openalex.org/I68986083","display_name":"Northwest Normal University","ror":"https://ror.org/00gx3j908","country_code":"CN","type":"education","lineage":["https://openalex.org/I68986083"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolong Bu","raw_affiliation_strings":["College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China","institution_ids":["https://openalex.org/I68986083"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101631202","display_name":"Lili Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I68986083","display_name":"Northwest Normal University","ror":"https://ror.org/00gx3j908","country_code":"CN","type":"education","lineage":["https://openalex.org/I68986083"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lili Wang","raw_affiliation_strings":["College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Physics and Electronic Engineering, Northwest Normal University, Lanzhou, China","institution_ids":["https://openalex.org/I68986083"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5060794156"],"corresponding_institution_ids":["https://openalex.org/I68986083"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.3006,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.86036443,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"7","issue":null,"first_page":"167884","last_page":"167894"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.8918882608413696},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8356021642684937},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.689223051071167},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5211610794067383},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.45944276452064514},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.44893819093704224},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.44334715604782104},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42986100912094116},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1889440417289734}],"concepts":[{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.8918882608413696},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8356021642684937},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.689223051071167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5211610794067383},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.45944276452064514},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.44893819093704224},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.44334715604782104},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42986100912094116},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1889440417289734},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2019.2954342","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2019.2954342","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08906089.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:90efe70147fe4bdbae708d94b981f946","is_oa":true,"landing_page_url":"https://doaj.org/article/90efe70147fe4bdbae708d94b981f946","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 7, Pp 167884-167894 (2019)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2019.2954342","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2019.2954342","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8600701/08906089.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7699999809265137,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5867887195","display_name":null,"funder_award_id":"11664036","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2990384275.pdf","grobid_xml":"https://content.openalex.org/works/W2990384275.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W40001856","https://openalex.org/W1492383498","https://openalex.org/W1570923747","https://openalex.org/W1572989473","https://openalex.org/W2014869452","https://openalex.org/W2043003570","https://openalex.org/W2064675550","https://openalex.org/W2081254602","https://openalex.org/W2102003408","https://openalex.org/W2111284386","https://openalex.org/W2129142580","https://openalex.org/W2147880316","https://openalex.org/W2150658333","https://openalex.org/W2294797155","https://openalex.org/W2296283641","https://openalex.org/W2323187260","https://openalex.org/W2380370523","https://openalex.org/W2398071208","https://openalex.org/W2400517318","https://openalex.org/W2471520273","https://openalex.org/W2511703664","https://openalex.org/W2574456902","https://openalex.org/W2588359766","https://openalex.org/W2751205669","https://openalex.org/W2759465110","https://openalex.org/W2922185715","https://openalex.org/W2937909162","https://openalex.org/W2963609956","https://openalex.org/W2964243274","https://openalex.org/W4235154690","https://openalex.org/W6601627100","https://openalex.org/W6634186343","https://openalex.org/W6682082992","https://openalex.org/W6696843773","https://openalex.org/W6732764752","https://openalex.org/W6736204136"],"related_works":["https://openalex.org/W2990005675","https://openalex.org/W2374317326","https://openalex.org/W1603321096","https://openalex.org/W2394766824","https://openalex.org/W2078713291","https://openalex.org/W2361574037","https://openalex.org/W2386292991","https://openalex.org/W2364440891","https://openalex.org/W2393726922","https://openalex.org/W2366752344"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,21,38,45,83,102,105,112,118,123,145,187,267],"deep":[4,57],"learning-based":[5],"Mandarin-Tibetan":[6],"cross-lingual":[7,218,228,254],"speech":[8,14,18,140,203,219,255,283],"synthesis":[9,15,19,141,220,256,284],"to":[10,30,143,172,265],"realize":[11],"both":[12,134],"Mandarin":[13,41,135,161,183,199,207,248],"and":[16,44,66,122,130,136,157,162,230],"Tibetan":[17,25,48,84,95,98,107,137,163,185,202,209,232,237,272],"under":[20],"unique":[22],"framework.":[23,234,274],"Because":[24],"training":[26,238,263],"corpus":[27,43,191,239,264],"is":[28,170,222],"hard":[29],"record,":[31],"we":[32,196],"train":[33,144,173],"the":[34,128,131,139,167,198,205,215,225,231,243,251,262,271,276,291],"acoustic":[35,52],"models":[36,53,181],"with":[37,56,114,153,186],"large":[39],"scale":[40,47],"multi-speaker":[42],"small":[46,188],"one-speaker":[49],"corpus.":[50,165,296],"The":[51,97,211,235],"are":[54],"trained":[55],"neural":[58],"network":[59],"(DNN),":[60],"hybrid":[61,67,155,158,176,179,216,252],"long":[62,69],"short-term":[63,70],"memory":[64,71],"(LSTM),":[65],"bi-directional":[68],"(BLSTM).":[72],"We":[73,126],"also":[74],"further":[75],"extend":[76],"our":[77],"Chinese":[78,93],"text":[79,85,99,103],"analyzer":[80,86,100],"by":[81,289],"adding":[82],"for":[87,282],"generating":[88],"context-dependent":[89],"labels":[90],"from":[91,160,192],"input":[92],"or":[94,178,184,201,208],"sentences.":[96],"includes":[101],"normalization,":[104],"novel":[106],"word":[108],"segmentation":[109],"that":[110,214],"combines":[111],"BLSTM":[113,159,180],"conditional":[115],"random":[116],"field,":[117],"prosodic":[119],"boundary":[120],"prediction,":[121],"grapheme-to-phoneme":[124],"conversion.":[125],"select":[127],"initials":[129],"finals":[132],"of":[133,182,246,261,285],"as":[138,270],"units":[142],"speaker-independent":[146],"mixed":[147,164,236],"language":[148],"average":[149],"voice":[150,244,269],"model":[151],"(AVM)":[152],"DNN,":[154,175],"LSTM,":[156,177],"Then":[166],"speaker":[168,190],"adaptation":[169],"applied":[171],"speaker-dependent":[174,206],"target":[189],"an":[193],"AVM.":[194],"Finally,":[195],"synthesize":[197,266],"speech,":[200],"though":[204],"models.":[210],"experiments":[212],"show":[213],"BLSTM-based":[217,253],"framework":[221,257],"better":[223],"than":[224],"other":[226],"two":[227],"frameworks":[229],"monolingual":[233,273],"does":[240],"not":[241],"influence":[242],"quality":[245],"synthesized":[247],"speech.":[249],"Furthermore,":[250],"only":[258],"needs":[259],"60%":[260],"similar":[268],"Therefore,":[275],"proposed":[277],"method":[278],"can":[279],"be":[280],"used":[281],"low":[286],"resource":[287,294],"languages":[288],"borrowing":[290],"same":[292],"tremendous":[293],"language's":[295]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":2}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
