{"id":"https://openalex.org/W4313123884","doi":"https://doi.org/10.1109/icspcc55723.2022.9984283","title":"A Comparison of Text Selection Algorithms for Sequence-to-Sequence Neural TTS","display_name":"A Comparison of Text Selection Algorithms for Sequence-to-Sequence Neural TTS","publication_year":2022,"publication_date":"2022-10-25","ids":{"openalex":"https://openalex.org/W4313123884","doi":"https://doi.org/10.1109/icspcc55723.2022.9984283"},"language":"en","primary_location":{"id":"doi:10.1109/icspcc55723.2022.9984283","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icspcc55723.2022.9984283","pdf_url":null,"source":{"id":"https://openalex.org/S4363608295","display_name":"2022 IEEE International Conference on Signal Processing, Communications and Computing (ICSPCC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Signal Processing, Communications and Computing (ICSPCC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024987550","display_name":"Stefan Taubert","orcid":"https://orcid.org/0000-0002-4932-2874"},"institutions":[{"id":"https://openalex.org/I2610724","display_name":"Chemnitz University of Technology","ror":"https://ror.org/00a208s56","country_code":"DE","type":"education","lineage":["https://openalex.org/I2610724"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Stefan Taubert","raw_affiliation_strings":["Chemnitz University of Technology,Department of Computer Science","Department of Computer Science, Chemnitz University of Technology"],"affiliations":[{"raw_affiliation_string":"Chemnitz University of Technology,Department of Computer Science","institution_ids":["https://openalex.org/I2610724"]},{"raw_affiliation_string":"Department of Computer Science, Chemnitz University of Technology","institution_ids":["https://openalex.org/I2610724"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030539771","display_name":"Jasmin Sternkopf","orcid":null},"institutions":[{"id":"https://openalex.org/I2610724","display_name":"Chemnitz University of Technology","ror":"https://ror.org/00a208s56","country_code":"DE","type":"education","lineage":["https://openalex.org/I2610724"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jasmin Sternkopf","raw_affiliation_strings":["Chemnitz University of Technology,Department of Mathematics","Department of Mathematics, Chemnitz University of Technology"],"affiliations":[{"raw_affiliation_string":"Chemnitz University of Technology,Department of Mathematics","institution_ids":["https://openalex.org/I2610724"]},{"raw_affiliation_string":"Department of Mathematics, Chemnitz University of Technology","institution_ids":["https://openalex.org/I2610724"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007734172","display_name":"Stefan Kahl","orcid":"https://orcid.org/0000-0002-2411-8877"},"institutions":[{"id":"https://openalex.org/I2610724","display_name":"Chemnitz University of Technology","ror":"https://ror.org/00a208s56","country_code":"DE","type":"education","lineage":["https://openalex.org/I2610724"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Stefan Kahl","raw_affiliation_strings":["Chemnitz University of Technology,Department of Computer Science","Department of Computer Science, Chemnitz University of Technology"],"affiliations":[{"raw_affiliation_string":"Chemnitz University of Technology,Department of Computer Science","institution_ids":["https://openalex.org/I2610724"]},{"raw_affiliation_string":"Department of Computer Science, Chemnitz University of Technology","institution_ids":["https://openalex.org/I2610724"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071056491","display_name":"Maximilian Eibl","orcid":"https://orcid.org/0000-0002-9519-2708"},"institutions":[{"id":"https://openalex.org/I2610724","display_name":"Chemnitz University of Technology","ror":"https://ror.org/00a208s56","country_code":"DE","type":"education","lineage":["https://openalex.org/I2610724"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Maximilian Eibl","raw_affiliation_strings":["Chemnitz University of Technology,Department of Computer Science","Department of Computer Science, Chemnitz University of Technology"],"affiliations":[{"raw_affiliation_string":"Chemnitz University of Technology,Department of Computer Science","institution_ids":["https://openalex.org/I2610724"]},{"raw_affiliation_string":"Department of Computer Science, Chemnitz University of Technology","institution_ids":["https://openalex.org/I2610724"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5024987550"],"corresponding_institution_ids":["https://openalex.org/I2610724"],"apc_list":null,"apc_paid":null,"fwci":0.1046,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.3427678,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7226915955543518},{"id":"https://openalex.org/keywords/greedy-algorithm","display_name":"Greedy algorithm","score":0.6175930500030518},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5451979637145996},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5160529017448425},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.513981282711029},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4841323792934418},{"id":"https://openalex.org/keywords/naturalness","display_name":"Naturalness","score":0.46633172035217285},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4270452857017517},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.42628684639930725},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.41757482290267944},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15683963894844055}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7226915955543518},{"id":"https://openalex.org/C51823790","wikidata":"https://www.wikidata.org/wiki/Q504353","display_name":"Greedy algorithm","level":2,"score":0.6175930500030518},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5451979637145996},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5160529017448425},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.513981282711029},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4841323792934418},{"id":"https://openalex.org/C134537474","wikidata":"https://www.wikidata.org/wiki/Q17144832","display_name":"Naturalness","level":2,"score":0.46633172035217285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4270452857017517},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.42628684639930725},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.41757482290267944},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15683963894844055},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icspcc55723.2022.9984283","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icspcc55723.2022.9984283","pdf_url":null,"source":{"id":"https://openalex.org/S4363608295","display_name":"2022 IEEE International Conference on Signal Processing, Communications and Computing (ICSPCC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Signal Processing, Communications and Computing (ICSPCC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7599999904632568,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W42086565","https://openalex.org/W94997927","https://openalex.org/W167729977","https://openalex.org/W170732776","https://openalex.org/W207086513","https://openalex.org/W1525540417","https://openalex.org/W1965555277","https://openalex.org/W2022191808","https://openalex.org/W2062366414","https://openalex.org/W2107860279","https://openalex.org/W2129142580","https://openalex.org/W2162248535","https://openalex.org/W2220416654","https://openalex.org/W2296111744","https://openalex.org/W2749074593","https://openalex.org/W2889028433","https://openalex.org/W2889129899","https://openalex.org/W2948238043","https://openalex.org/W2963609956","https://openalex.org/W2964138190","https://openalex.org/W2964243274","https://openalex.org/W2972359262","https://openalex.org/W2972428935","https://openalex.org/W2972569067","https://openalex.org/W2972950048","https://openalex.org/W3015645837","https://openalex.org/W3025528898","https://openalex.org/W3026356812","https://openalex.org/W3081416955","https://openalex.org/W4212774754","https://openalex.org/W4299162499","https://openalex.org/W4391156274","https://openalex.org/W6727791074","https://openalex.org/W6752124048","https://openalex.org/W6763316926","https://openalex.org/W6763832098","https://openalex.org/W6778083308","https://openalex.org/W6778823374","https://openalex.org/W6917585676"],"related_works":["https://openalex.org/W1914543332","https://openalex.org/W2946856121","https://openalex.org/W2108985546","https://openalex.org/W2433276473","https://openalex.org/W2077992636","https://openalex.org/W1537411440","https://openalex.org/W2024201202","https://openalex.org/W2535215250","https://openalex.org/W2049083033","https://openalex.org/W290673751"],"abstract_inverted_index":{"Previous":[0],"research":[1],"demonstrated":[2],"that":[3,91,109],"text":[4],"selection":[5,80,90],"algorithms":[6,37],"applied":[7],"in":[8,127],"the":[9,33,39,53,59,105,110,122,142,151,156,160],"context":[10],"of":[11,35,41,74,162],"concatenative":[12],"and":[13,26,86,175],"parametric":[14],"text-to-speech":[15],"(TTS)":[16],"systems":[17,187],"were":[18],"able":[19],"to":[20,51,93,121,132,170],"increase":[21],"synthesis":[22],"quality":[23,40],"(i.e.,":[24],"intelligibility":[25],"naturalness).":[27],"In":[28],"this":[29],"work,":[30],"we":[31],"investigate":[32],"effects":[34],"such":[36],"on":[38,134],"a":[42,71,87,95],"sequence-to-sequence":[43],"neural":[44],"TTS":[45,186],"system":[46],"when":[47],"they":[48],"are":[49,65],"used":[50],"create":[52],"training":[54,68,133],"set.":[55],"We":[56,166],"compare":[57],"how":[58],"mel":[60],"spectrograms":[61],"generated":[62],"by":[63,67],"Tacotron":[64],"affected":[66],"sets":[69],"with":[70,104],"total":[72],"duration":[73],"six":[75],"hours":[76],"created":[77],"using":[78],"three":[79,136],"approaches:":[81],"random":[82,111],"selection,":[83,85],"greedy":[84,89,124,144],"modified":[88],"attempts":[92],"produce":[94],"uniform":[96],"symbol":[97],"distribution.":[98],"The":[99],"evaluation":[100],"was":[101],"done":[102],"objectively":[103],"mel-cepstral":[106],"distance,":[107],"showing":[108],"approach":[112,145,158],"did":[113],"not":[114],"give":[115],"favorable":[116],"results":[117,131,149],"at":[118],"all":[119],"compared":[120],"two":[123],"approaches,":[125],"which":[126,185],"turn":[128],"achieved":[129,146],"close":[130],"about":[135],"times":[137],"as":[138],"much":[139],"data.":[140],"Thereby,":[141],"second":[143],"significantly":[147],"better":[148],"than":[150],"first":[152],"one,":[153],"making":[154],"it":[155],"recommended":[157],"for":[159,181,184],"task":[161],"reading":[163],"script":[164],"creation.":[165],"expect":[167],"these":[168],"findings":[169],"help":[171],"build":[172],"shorter":[173],"scripts":[174],"thus":[176],"reduce":[177],"recording":[178],"costs,":[179],"especially":[180],"low-resource":[182],"languages":[183],"should":[188],"be":[189],"deployed.":[190]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
