{"id":"https://openalex.org/W4391745456","doi":"https://doi.org/10.1186/s13636-024-00329-7","title":"Deep learning-based expressive speech synthesis: a systematic review of approaches, challenges, and resources","display_name":"Deep learning-based expressive speech synthesis: a systematic review of approaches, challenges, and resources","publication_year":2024,"publication_date":"2024-02-12","ids":{"openalex":"https://openalex.org/W4391745456","doi":"https://doi.org/10.1186/s13636-024-00329-7"},"language":"en","primary_location":{"id":"doi:10.1186/s13636-024-00329-7","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-024-00329-7","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-024-00329-7","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"type":"review","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-024-00329-7","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002336064","display_name":"Huda Mohammed Barakat","orcid":"https://orcid.org/0000-0002-7585-4970"},"institutions":[{"id":"https://openalex.org/I44925452","display_name":"\u00d6zye\u011fin University","ror":"https://ror.org/01jjhfr75","country_code":"TR","type":"education","lineage":["https://openalex.org/I44925452"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Huda Barakat","raw_affiliation_strings":["Department of Computer Science, Ozyegin University, Istanbul, 34794, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-7585-4970","affiliations":[{"raw_affiliation_string":"Department of Computer Science, Ozyegin University, Istanbul, 34794, Turkey","institution_ids":["https://openalex.org/I44925452"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046810738","display_name":"Oytun T\u00fcrk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oytun Turk","raw_affiliation_strings":["Independent Consultant/Researcher, Beaverton, OR, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Independent Consultant/Researcher, Beaverton, OR, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016845689","display_name":"Cenk Demiro\u011flu","orcid":"https://orcid.org/0000-0002-6160-3169"},"institutions":[{"id":"https://openalex.org/I44925452","display_name":"\u00d6zye\u011fin University","ror":"https://ror.org/01jjhfr75","country_code":"TR","type":"education","lineage":["https://openalex.org/I44925452"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Cenk Demiroglu","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Ozyegin University, Istanbul, 34794, Turkey"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Ozyegin University, Istanbul, 34794, Turkey","institution_ids":["https://openalex.org/I44925452"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5002336064"],"corresponding_institution_ids":["https://openalex.org/I44925452"],"apc_list":{"value":1115,"currency":"GBP","value_usd":1367},"apc_paid":{"value":1115,"currency":"GBP","value_usd":1367},"fwci":13.1642,"has_fulltext":true,"cited_by_count":43,"citation_normalized_percentile":{"value":0.99020629,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"2024","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.735358715057373},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.6057409644126892},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5873172879219055},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5553605556488037},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5154584050178528},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4502165615558624},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.34416788816452026}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.735358715057373},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.6057409644126892},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5873172879219055},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5553605556488037},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5154584050178528},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4502165615558624},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.34416788816452026},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1186/s13636-024-00329-7","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-024-00329-7","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-024-00329-7","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:5b52f0fa4f1c4dc1b8a60b673b757b76","is_oa":true,"landing_page_url":"https://doaj.org/article/5b52f0fa4f1c4dc1b8a60b673b757b76","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing, Vol 2024, Iss 1, Pp 1-34 (2024)","raw_type":"article"},{"id":"pmh:oai:eresearch.ozyegin.edu.tr:10679/9221","is_oa":true,"landing_page_url":"http://hdl.handle.net/10679/9221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400232","display_name":"ECS Journal of Solid State Science and Technology (The Electrochemical Society)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2802273670","host_organization_name":"Electrochemical Society","host_organization_lineage":["https://openalex.org/I2802273670"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/review"}],"best_oa_location":{"id":"doi:10.1186/s13636-024-00329-7","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-024-00329-7","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-024-00329-7","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6100000143051147,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4391745456.pdf"},"referenced_works_count":148,"referenced_works":["https://openalex.org/W2043003570","https://openalex.org/W2090777335","https://openalex.org/W2102003408","https://openalex.org/W2149628368","https://openalex.org/W2294130536","https://openalex.org/W2471520273","https://openalex.org/W2475287302","https://openalex.org/W2550497374","https://openalex.org/W2572730214","https://openalex.org/W2752782242","https://openalex.org/W2752796333","https://openalex.org/W2760103357","https://openalex.org/W2785364623","https://openalex.org/W2793479148","https://openalex.org/W2802968248","https://openalex.org/W2885800352","https://openalex.org/W2889092828","https://openalex.org/W2889141918","https://openalex.org/W2890287821","https://openalex.org/W2890606114","https://openalex.org/W2894755406","https://openalex.org/W2896886065","https://openalex.org/W2904459034","https://openalex.org/W2914049472","https://openalex.org/W2937870435","https://openalex.org/W2941649920","https://openalex.org/W2962691331","https://openalex.org/W2963609956","https://openalex.org/W2964138190","https://openalex.org/W2964243274","https://openalex.org/W2966387353","https://openalex.org/W2972359262","https://openalex.org/W2972956431","https://openalex.org/W2976159681","https://openalex.org/W2976532777","https://openalex.org/W2984342455","https://openalex.org/W2990883660","https://openalex.org/W3003284013","https://openalex.org/W3007067948","https://openalex.org/W3008691130","https://openalex.org/W3010916717","https://openalex.org/W3015212100","https://openalex.org/W3015645837","https://openalex.org/W3015796413","https://openalex.org/W3015841875","https://openalex.org/W3016021263","https://openalex.org/W3022876224","https://openalex.org/W3027876491","https://openalex.org/W3032080156","https://openalex.org/W3047443559","https://openalex.org/W3081488690","https://openalex.org/W3095401840","https://openalex.org/W3095491807","https://openalex.org/W3095505419","https://openalex.org/W3096830101","https://openalex.org/W3097003111","https://openalex.org/W3097795905","https://openalex.org/W3097892637","https://openalex.org/W3100400819","https://openalex.org/W3107262928","https://openalex.org/W3112336664","https://openalex.org/W3127721277","https://openalex.org/W3135644023","https://openalex.org/W3139170550","https://openalex.org/W3146550708","https://openalex.org/W3152136404","https://openalex.org/W3153370059","https://openalex.org/W3158374895","https://openalex.org/W3160329778","https://openalex.org/W3160844600","https://openalex.org/W3161113899","https://openalex.org/W3161492781","https://openalex.org/W3161732385","https://openalex.org/W3161822901","https://openalex.org/W3162791003","https://openalex.org/W3163003432","https://openalex.org/W3163339651","https://openalex.org/W3168542456","https://openalex.org/W3174285493","https://openalex.org/W3184324824","https://openalex.org/W3184592700","https://openalex.org/W3194208059","https://openalex.org/W3195366750","https://openalex.org/W3196843885","https://openalex.org/W3196866316","https://openalex.org/W3197113339","https://openalex.org/W3197216873","https://openalex.org/W3197704090","https://openalex.org/W3198104520","https://openalex.org/W3198123658","https://openalex.org/W3198311967","https://openalex.org/W3198609073","https://openalex.org/W3198791321","https://openalex.org/W3200756692","https://openalex.org/W3202098869","https://openalex.org/W3203313352","https://openalex.org/W3205316472","https://openalex.org/W3205631867","https://openalex.org/W3207354624","https://openalex.org/W3209059054","https://openalex.org/W4205742757","https://openalex.org/W4210723584","https://openalex.org/W4210777104","https://openalex.org/W4214883111","https://openalex.org/W4221165968","https://openalex.org/W4221167022","https://openalex.org/W4224924088","https://openalex.org/W4224926192","https://openalex.org/W4224928640","https://openalex.org/W4225300652","https://openalex.org/W4225306880","https://openalex.org/W4226421465","https://openalex.org/W4226487411","https://openalex.org/W4243499798","https://openalex.org/W4281562038","https://openalex.org/W4283689139","https://openalex.org/W4283771593","https://openalex.org/W4287212799","https://openalex.org/W4293523272","https://openalex.org/W4294311176","https://openalex.org/W4295036296","https://openalex.org/W4296068776","https://openalex.org/W4296069154","https://openalex.org/W4297536219","https://openalex.org/W4297841505","https://openalex.org/W4297841795","https://openalex.org/W4297841867","https://openalex.org/W4308273487","https://openalex.org/W4309874973","https://openalex.org/W4313155892","https://openalex.org/W4319985616","https://openalex.org/W4323896824","https://openalex.org/W4372260289","https://openalex.org/W4372266971","https://openalex.org/W4372346370","https://openalex.org/W6600013530","https://openalex.org/W6600274115","https://openalex.org/W6600274734","https://openalex.org/W6600424091","https://openalex.org/W6600473098","https://openalex.org/W6600741150","https://openalex.org/W6602226494","https://openalex.org/W6603173416","https://openalex.org/W6607786901","https://openalex.org/W6632668414","https://openalex.org/W6634817459","https://openalex.org/W6756821666","https://openalex.org/W6778883912"],"related_works":["https://openalex.org/W4375867731","https://openalex.org/W2611989081","https://openalex.org/W4230611425","https://openalex.org/W2731899572","https://openalex.org/W4304166257","https://openalex.org/W4294635752","https://openalex.org/W4383066092","https://openalex.org/W3215138031","https://openalex.org/W2804383999","https://openalex.org/W2802049774"],"abstract_inverted_index":{"Abstract":[0],"Speech":[1],"synthesis":[2,91,107],"has":[3],"made":[4],"significant":[5],"strides":[6],"thanks":[7],"to":[8,14,25,74,160,191,201,204],"the":[9,23,38,102,111,147,157,167,170],"transition":[10],"from":[11],"machine":[12],"learning":[13,16],"deep":[15,123],"models.":[17],"Contemporary":[18],"text-to-speech":[19],"(TTS)":[20],"models":[21,57,87,108,133,139],"possess":[22],"capability":[24],"generate":[26],"speech":[27,49,64,90,106],"of":[28,41,101,138,196],"exceptionally":[29],"high":[30],"quality,":[31],"closely":[32],"mimicking":[33],"human":[34,75],"speech.":[35,76],"Nevertheless,":[36],"given":[37],"wide":[39],"array":[40],"applications":[42],"now":[43],"employing":[44],"TTS":[45,56],"models,":[46],"mere":[47],"high-quality":[48],"generation":[50],"is":[51,190],"no":[52],"longer":[53],"sufficient.":[54],"Present-day":[55],"must":[58],"also":[59],"excel":[60],"at":[61],"producing":[62],"expressive":[63,89,105],"that":[65,181],"can":[66],"convey":[67],"various":[68],"speaking":[69],"styles":[70],"and":[71,134,155,207],"emotions,":[72],"akin":[73],"Consequently,":[77],"researchers":[78,206],"have":[79],"concentrated":[80],"their":[81],"efforts":[82],"on":[83,104,119,122],"developing":[84],"more":[85],"efficient":[86],"for":[88,131],"in":[92,151,166,178,210],"recent":[93],"years.":[94],"This":[95],"paper":[96],"presents":[97],"a":[98,116,127],"systematic":[99],"review":[100],"literature":[103],"published":[109],"within":[110],"last":[112],"5":[113],"years,":[114],"with":[115,187],"particular":[117],"emphasis":[118],"approaches":[120],"based":[121],"learning.":[124],"We":[125],"offer":[126,202],"comprehensive":[128],"classification":[129],"scheme":[130],"these":[132,162],"provide":[135],"concise":[136],"descriptions":[137],"falling":[140],"into":[141],"each":[142],"category.":[143],"Additionally,":[144],"we":[145,173],"summarize":[146],"principal":[148],"challenges":[149,163],"encountered":[150],"this":[152,179,188,197,211],"research":[153,176,199],"domain":[154],"outline":[156],"strategies":[158],"employed":[159],"tackle":[161],"as":[164],"documented":[165],"literature.":[168],"In":[169],"Section":[171],"8,":[172],"pinpoint":[174],"some":[175],"gaps":[177],"field":[180],"necessitate":[182],"further":[183],"exploration.":[184],"Our":[185],"objective":[186],"work":[189],"give":[192],"an":[193],"all-encompassing":[194],"overview":[195],"hot":[198],"area":[200],"guidance":[203],"interested":[205],"future":[208],"endeavors":[209],"field.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":9},{"year":2025,"cited_by_count":29},{"year":2024,"cited_by_count":5}],"updated_date":"2026-06-10T14:10:52.464848","created_date":"2025-10-10T00:00:00"}
