{"id":"https://openalex.org/W4224903715","doi":"https://doi.org/10.21437/interspeech.2022-10689","title":"Exploration strategies for articulatory synthesis of complex syllable onsets","display_name":"Exploration strategies for articulatory synthesis of complex syllable onsets","publication_year":2022,"publication_date":"2022-09-16","ids":{"openalex":"https://openalex.org/W4224903715","doi":"https://doi.org/10.21437/interspeech.2022-10689"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2022-10689","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-10689","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057837548","display_name":"Daniel van Niekerk","orcid":"https://orcid.org/0000-0002-7324-2751"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Daniel Van Niekerk","raw_affiliation_strings":["Department of Speech, Hearing and Phonetic Sciences, University College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Speech, Hearing and Phonetic Sciences, University College London, UK","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022797639","display_name":"Anqi Xu","orcid":"https://orcid.org/0000-0002-4331-6676"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Anqi Xu","raw_affiliation_strings":["Department of Speech, Hearing and Phonetic Sciences, University College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Speech, Hearing and Phonetic Sciences, University College London, UK","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001239900","display_name":"Branislav Gerazov","orcid":"https://orcid.org/0000-0003-2498-6831"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Branislav Gerazov","raw_affiliation_strings":["Faculty of Electrical Engineering and Information Technologies, CMUS, Skopje, RN Macedonia"],"affiliations":[{"raw_affiliation_string":"Faculty of Electrical Engineering and Information Technologies, CMUS, Skopje, RN Macedonia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004916681","display_name":"Paul Konstantin Krug","orcid":"https://orcid.org/0000-0001-8518-8142"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"TU Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Paul Konstantin Krug","raw_affiliation_strings":["Institute of Acoustics and Speech Communication, Technische Universit\u00e4t Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics and Speech Communication, Technische Universit\u00e4t Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046141664","display_name":"Peter Birkholz","orcid":"https://orcid.org/0000-0003-0167-8123"},"institutions":[{"id":"https://openalex.org/I78650965","display_name":"TU Dresden","ror":"https://ror.org/042aqky30","country_code":"DE","type":"education","lineage":["https://openalex.org/I78650965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Peter Birkholz","raw_affiliation_strings":["Institute of Acoustics and Speech Communication, Technische Universit\u00e4t Dresden, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics and Speech Communication, Technische Universit\u00e4t Dresden, Germany","institution_ids":["https://openalex.org/I78650965"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100419183","display_name":"Yi Xu","orcid":"https://orcid.org/0000-0002-5768-8235"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yi Xu","raw_affiliation_strings":["Department of Speech, Hearing and Phonetic Sciences, University College London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Speech, Hearing and Phonetic Sciences, University College London, UK","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5057837548"],"corresponding_institution_ids":["https://openalex.org/I45129253"],"apc_list":null,"apc_paid":null,"fwci":0.3131,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.4809221,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"635","last_page":"639"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coarticulation","display_name":"Coarticulation","score":0.945015549659729},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.7920944690704346},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.768060564994812},{"id":"https://openalex.org/keywords/syllable","display_name":"Syllable","score":0.7026384472846985},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5713672637939453},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5491299629211426},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5348412394523621},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5112879276275635},{"id":"https://openalex.org/keywords/speech-production","display_name":"Speech production","score":0.43949174880981445},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.399813711643219},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32878339290618896},{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.09632956981658936},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07698118686676025}],"concepts":[{"id":"https://openalex.org/C130727458","wikidata":"https://www.wikidata.org/wiki/Q1639109","display_name":"Coarticulation","level":3,"score":0.945015549659729},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.7920944690704346},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.768060564994812},{"id":"https://openalex.org/C109089402","wikidata":"https://www.wikidata.org/wiki/Q8188","display_name":"Syllable","level":2,"score":0.7026384472846985},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5713672637939453},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5491299629211426},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5348412394523621},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5112879276275635},{"id":"https://openalex.org/C43617652","wikidata":"https://www.wikidata.org/wiki/Q7575399","display_name":"Speech production","level":2,"score":0.43949174880981445},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.399813711643219},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32878339290618896},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.09632956981658936},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07698118686676025},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2022-10689","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-10689","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10160011","is_oa":false,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10160011/","pdf_url":null,"source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"     In:  Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH 2022.  (pp. pp. 635-639).  ISCA (2022)     ","raw_type":"Proceedings paper"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.800000011920929}],"awards":[{"id":"https://openalex.org/G1297994486","display_name":null,"funder_award_id":"RPG-2019-241","funder_id":"https://openalex.org/F4320319993","funder_display_name":"Leverhulme Trust"}],"funders":[{"id":"https://openalex.org/F4320319993","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1616590059","https://openalex.org/W1965378753","https://openalex.org/W1992544351","https://openalex.org/W2010188467","https://openalex.org/W2020944885","https://openalex.org/W2041110166","https://openalex.org/W2077494771","https://openalex.org/W2106411961","https://openalex.org/W2110095567","https://openalex.org/W2116086091","https://openalex.org/W2120282994","https://openalex.org/W2126289105","https://openalex.org/W2149411572","https://openalex.org/W2170503911","https://openalex.org/W2184270665","https://openalex.org/W2546861836","https://openalex.org/W2972552159","https://openalex.org/W3025683731","https://openalex.org/W3095560934","https://openalex.org/W3125043549","https://openalex.org/W3165674041","https://openalex.org/W3193311858","https://openalex.org/W4200041014","https://openalex.org/W4236211584","https://openalex.org/W4240065129","https://openalex.org/W4300903355","https://openalex.org/W4301823191"],"related_works":["https://openalex.org/W2047235756","https://openalex.org/W2355417428","https://openalex.org/W1890221585","https://openalex.org/W3304542","https://openalex.org/W196866866","https://openalex.org/W2119371555","https://openalex.org/W2391432493","https://openalex.org/W2063670285","https://openalex.org/W2169455968","https://openalex.org/W166167026"],"abstract_inverted_index":{"High-quality":[0],"articulatory":[1,21,60],"speech":[2,9],"synthesis":[3],"has":[4],"many":[5],"potential":[6],"applications":[7],"in":[8],"science":[10],"and":[11,25,54],"technology.":[12],"However,":[13],"developing":[14],"appropriate":[15],"mappings":[16,43],"from":[17],"linguistic":[18],"specification":[19],"to":[20,64],"gestures":[22,61],"is":[23],"difficult":[24],"time":[26],"consuming.":[27],"In":[28],"this":[29],"paper":[30],"we":[31],"construct":[32],"an":[33],"optimisation-based":[34],"framework":[35],"as":[36],"a":[37],"first":[38],"step":[39],"towards":[40],"learning":[41],"these":[42],"without":[44],"manual":[45],"intervention.":[46],"We":[47],"demonstrate":[48],"the":[49,56,59],"production":[50],"of":[51,58],"CCV":[52],"syllables":[53],"discuss":[55],"quality":[57],"with":[62],"reference":[63],"coarticulation.":[65]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
