{"id":"https://openalex.org/W3090474612","doi":"https://doi.org/10.1109/access.2020.3027619","title":"Hierarchical Transfer Learning for Multilingual, Multi-Speaker, and Style Transfer DNN-Based TTS on Low-Resource Languages","display_name":"Hierarchical Transfer Learning for Multilingual, Multi-Speaker, and Style Transfer DNN-Based TTS on Low-Resource Languages","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3090474612","doi":"https://doi.org/10.1109/access.2020.3027619","mag":"3090474612"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3027619","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3027619","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09208651.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09208651.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066073372","display_name":"Kurniawati Azizah","orcid":"https://orcid.org/0000-0002-3217-7025"},"institutions":[{"id":"https://openalex.org/I29617571","display_name":"University of Indonesia","ror":"https://ror.org/0116zj450","country_code":"ID","type":"education","lineage":["https://openalex.org/I29617571"]}],"countries":["ID"],"is_corresponding":true,"raw_author_name":"Kurniawati Azizah","raw_affiliation_strings":["Faculty of Computer Science, Universitas Indonesia, Depok, Indonesia"],"raw_orcid":"https://orcid.org/0000-0002-3217-7025","affiliations":[{"raw_affiliation_string":"Faculty of Computer Science, Universitas Indonesia, Depok, Indonesia","institution_ids":["https://openalex.org/I29617571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052754690","display_name":"Mirna Adriani","orcid":null},"institutions":[{"id":"https://openalex.org/I29617571","display_name":"University of Indonesia","ror":"https://ror.org/0116zj450","country_code":"ID","type":"education","lineage":["https://openalex.org/I29617571"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Mirna Adriani","raw_affiliation_strings":["Faculty of Computer Science, Universitas Indonesia, Depok, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Computer Science, Universitas Indonesia, Depok, Indonesia","institution_ids":["https://openalex.org/I29617571"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069933043","display_name":"Wisnu Jatmiko","orcid":"https://orcid.org/0000-0002-0530-7955"},"institutions":[{"id":"https://openalex.org/I29617571","display_name":"University of Indonesia","ror":"https://ror.org/0116zj450","country_code":"ID","type":"education","lineage":["https://openalex.org/I29617571"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Wisnu Jatmiko","raw_affiliation_strings":["Faculty of Computer Science, Universitas Indonesia, Depok, Indonesia"],"raw_orcid":"https://orcid.org/0000-0002-0530-7955","affiliations":[{"raw_affiliation_string":"Faculty of Computer Science, Universitas Indonesia, Depok, Indonesia","institution_ids":["https://openalex.org/I29617571"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5066073372"],"corresponding_institution_ids":["https://openalex.org/I29617571"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.8559,"has_fulltext":true,"cited_by_count":33,"citation_normalized_percentile":{"value":0.92605634,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"8","issue":null,"first_page":"179798","last_page":"179812"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7691643834114075},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.6343590617179871},{"id":"https://openalex.org/keywords/indonesian","display_name":"Indonesian","score":0.5779920816421509},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.5491528511047363},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5294952988624573},{"id":"https://openalex.org/keywords/mean-opinion-score","display_name":"Mean opinion score","score":0.49665313959121704},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4936750829219818},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47204315662384033},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.33591991662979126},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2719356417655945}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7691643834114075},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.6343590617179871},{"id":"https://openalex.org/C2779207338","wikidata":"https://www.wikidata.org/wiki/Q9240","display_name":"Indonesian","level":2,"score":0.5779920816421509},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.5491528511047363},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5294952988624573},{"id":"https://openalex.org/C62897895","wikidata":"https://www.wikidata.org/wiki/Q1915482","display_name":"Mean opinion score","level":3,"score":0.49665313959121704},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4936750829219818},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47204315662384033},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.33591991662979126},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2719356417655945},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3027619","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3027619","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09208651.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:9a68402e86984b9d8c52cec2298d2fbb","is_oa":true,"landing_page_url":"https://doaj.org/article/9a68402e86984b9d8c52cec2298d2fbb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 179798-179812 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3027619","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3027619","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09208651.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6899999976158142}],"awards":[{"id":"https://openalex.org/G1524716514","display_name":null,"funder_award_id":"RST/HKP.05.00/2020","funder_id":"https://openalex.org/F4320323819","funder_display_name":"Universitas Indonesia"},{"id":"https://openalex.org/G6349052386","display_name":null,"funder_award_id":"NKB-566/UN2.RST/HKP.05.00/2020","funder_id":"https://openalex.org/F4320323819","funder_display_name":"Universitas Indonesia"},{"id":"https://openalex.org/G7379709468","display_name":null,"funder_award_id":"00/2020","funder_id":"https://openalex.org/F4320323819","funder_display_name":"Universitas Indonesia"}],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320323819","display_name":"Universitas Indonesia","ror":"https://ror.org/0116zj450"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3090474612.pdf","grobid_xml":"https://content.openalex.org/works/W3090474612.grobid-xml"},"referenced_works_count":77,"referenced_works":["https://openalex.org/W854541894","https://openalex.org/W1522301498","https://openalex.org/W1570629387","https://openalex.org/W1579838312","https://openalex.org/W2084609288","https://openalex.org/W2091425152","https://openalex.org/W2095734449","https://openalex.org/W2102003408","https://openalex.org/W2107740512","https://openalex.org/W2107860279","https://openalex.org/W2111284386","https://openalex.org/W2130086727","https://openalex.org/W2133564696","https://openalex.org/W2153914468","https://openalex.org/W2165698076","https://openalex.org/W2338517121","https://openalex.org/W2395579298","https://openalex.org/W2591927543","https://openalex.org/W2619368999","https://openalex.org/W2739077999","https://openalex.org/W2743452000","https://openalex.org/W2769810959","https://openalex.org/W2775336875","https://openalex.org/W2794490148","https://openalex.org/W2795109282","https://openalex.org/W2887280559","https://openalex.org/W2889028433","https://openalex.org/W2895654193","https://openalex.org/W2906459023","https://openalex.org/W2910199258","https://openalex.org/W2913818371","https://openalex.org/W2914049472","https://openalex.org/W2919358988","https://openalex.org/W2921135010","https://openalex.org/W2928389720","https://openalex.org/W2939833446","https://openalex.org/W2942231644","https://openalex.org/W2962699523","https://openalex.org/W2963027641","https://openalex.org/W2963300588","https://openalex.org/W2963331137","https://openalex.org/W2963403868","https://openalex.org/W2963609956","https://openalex.org/W2963691546","https://openalex.org/W2963712897","https://openalex.org/W2963782041","https://openalex.org/W2963927338","https://openalex.org/W2963945466","https://openalex.org/W2964121744","https://openalex.org/W2964243274","https://openalex.org/W2964281804","https://openalex.org/W2964308564","https://openalex.org/W2969521066","https://openalex.org/W2969856879","https://openalex.org/W2973034126","https://openalex.org/W2976159681","https://openalex.org/W2993078836","https://openalex.org/W3010945169","https://openalex.org/W3015645837","https://openalex.org/W3028613123","https://openalex.org/W3109182305","https://openalex.org/W4294619240","https://openalex.org/W4295731579","https://openalex.org/W4385245566","https://openalex.org/W6623517193","https://openalex.org/W6631190155","https://openalex.org/W6674565674","https://openalex.org/W6675380101","https://openalex.org/W6675938391","https://openalex.org/W6679434410","https://openalex.org/W6734815144","https://openalex.org/W6738277540","https://openalex.org/W6739901393","https://openalex.org/W6749489859","https://openalex.org/W6750489868","https://openalex.org/W6778159118","https://openalex.org/W6786584023"],"related_works":["https://openalex.org/W4242621793","https://openalex.org/W648807974","https://openalex.org/W4229837155","https://openalex.org/W4236086937","https://openalex.org/W2294302573","https://openalex.org/W4312419881","https://openalex.org/W2086953810","https://openalex.org/W2512763533","https://openalex.org/W2151415191","https://openalex.org/W2151664070"],"abstract_inverted_index":{"This":[0],"work":[1],"applies":[2],"a":[3,23,46,58,75,79,118,129,156,176,234,250,271],"hierarchical":[4],"transfer":[5,60,110,133,194,267],"learning":[6,61,111],"to":[7,63,117,128,227,244,254],"implement":[8],"deep":[9],"neural":[10],"network":[11,253],"(DNN)-based":[12],"multilingual":[13,81,119,126,130,153],"text-to-speech":[14],"(TTS)":[15],"for":[16,39,50,68,163,170,210],"low-resource":[17,51,69,84,98,229],"languages.":[18,52,70,85],"DNN-based":[19,33],"system":[20],"typically":[21],"requires":[22],"large":[24],"amount":[25,236],"of":[26,74,83,146,151,161,178,205,237],"training":[27,238],"data.":[28],"In":[29,53],"recent":[30],"years,":[31],"while":[32],"TTS":[34,66,89,116,120,127,154,197,252],"has":[35],"made":[36],"remarkable":[37],"results":[38,217],"high-resource":[40,76,92],"languages,":[41],"it":[42,174],"still":[43],"suffers":[44],"from":[45,112,123,249,270],"data":[47],"scarcity":[48],"problem":[49],"this":[54],"article,":[55],"we":[56,106],"propose":[57],"multi-stage":[59],"strategy":[62,222],"train":[64],"our":[65,152,196,240],"model":[67,103,198],"We":[71],"make":[72],"use":[73],"language":[77,93,99],"and":[78,121,140,172,184,208,213,265],"joint":[80],"dataset":[82],"A":[86],"pre-trained":[87,114,125],"monolingual":[88,115],"on":[90,96,137],"the":[91,97,101,113,124,220,228,261],"is":[94],"fine-tuned":[95],"using":[100],"same":[102],"architecture.":[104],"Then,":[105],"apply":[107],"partial":[108],"network-based":[109],"finally":[122],"with":[131],"style":[132,193,269],"TTS.":[134],"Our":[135],"experiment":[136],"Indonesian,":[138,211],"Javanese,":[139,212],"Sundanese":[141,173],"languages":[142,230],"show":[143],"adequate":[144],"quality":[145],"synthesized":[147],"speech.":[148],"The":[149,216],"evaluation":[150],"reaches":[155,175,199],"mean":[157],"opinion":[158],"score":[159],"(MOS)":[160],"4.35":[162],"Indonesian":[164],"(ground":[165,180,186],"truth":[166,181,187],"=":[167,182,188],"4.36).":[168],"Whereas":[169],"Javanese":[171],"MOS":[177],"4.20":[179],"4.38)":[183],"4.28":[185],"4.20),":[189],"respectively.":[190,215],"For":[191],"parallel":[192],"evaluation,":[195],"an":[200],"F0":[201],"frame":[202],"error":[203],"(FFE)":[204],"9.08%,":[206],"10.13%,":[207],"8.43%":[209],"Sundanese,":[214],"indicate":[218],"that":[219],"proposed":[221],"can":[223],"be":[224],"effectively":[225],"applied":[226],"target":[231],"domain.":[232],"With":[233],"small":[235],"data,":[239],"models":[241],"are":[242],"able":[243],"learn":[245],"step":[246,248],"by":[247],"smaller":[251],"larger":[255],"networks,":[256],"produce":[257],"intelligible":[258],"speech":[259],"approaching":[260],"real":[262],"human":[263],"voice,":[264],"successfully":[266],"speaking":[268],"reference":[272],"audio.":[273]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":4}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
