{"id":"https://openalex.org/W3196942063","doi":"https://doi.org/10.21437/interspeech.2021-1422","title":"Model-Based Exploration of Linking Between Vowel Articulatory Space and Acoustic Space","display_name":"Model-Based Exploration of Linking Between Vowel Articulatory Space and Acoustic Space","publication_year":2021,"publication_date":"2021-08-27","ids":{"openalex":"https://openalex.org/W3196942063","doi":"https://doi.org/10.21437/interspeech.2021-1422","mag":"3196942063"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2021-1422","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-1422","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://discovery.ucl.ac.uk/10139361/1/xu21j_interspeech.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022797639","display_name":"Anqi Xu","orcid":"https://orcid.org/0000-0002-4331-6676"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anqi Xu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057837548","display_name":"Daniel van Niekerk","orcid":"https://orcid.org/0000-0002-7324-2751"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Daniel van Niekerk","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001239900","display_name":"Branislav Gerazov","orcid":"https://orcid.org/0000-0003-2498-6831"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Branislav Gerazov","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004916681","display_name":"Paul Konstantin Krug","orcid":"https://orcid.org/0000-0001-8518-8142"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Paul Konstantin Krug","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003455071","display_name":"Santitham Prom\u2013on","orcid":"https://orcid.org/0000-0002-0869-089X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Santitham Prom-on","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046141664","display_name":"Peter Birkholz","orcid":"https://orcid.org/0000-0003-0167-8123"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peter Birkholz","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049702508","display_name":"Yi Xu","orcid":"https://orcid.org/0000-0002-8541-2658"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi Xu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1376479,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3191","last_page":"3195"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.7800557613372803},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.7192445993423462},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6400043964385986},{"id":"https://openalex.org/keywords/acoustic-space","display_name":"Acoustic space","score":0.6315439343452454},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5948392748832703},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.5528454780578613},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.15672150254249573},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.15642660856246948}],"concepts":[{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.7800557613372803},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.7192445993423462},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6400043964385986},{"id":"https://openalex.org/C108250783","wikidata":"https://www.wikidata.org/wiki/Q4674710","display_name":"Acoustic space","level":3,"score":0.6315439343452454},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5948392748832703},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.5528454780578613},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.15672150254249573},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.15642660856246948},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2021-1422","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-1422","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10139361","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10139361/","pdf_url":"https://discovery.ucl.ac.uk/10139361/1/xu21j_interspeech.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"     In:  Proceedings of the Annual Conference of the International Speech Communication Association: INTERSPEECH 2021.  (pp. pp. 3191-3195).  ISCA: Brno, Czechia. (2021)     ","raw_type":"Proceedings paper"}],"best_oa_location":{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10139361","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10139361/","pdf_url":"https://discovery.ucl.ac.uk/10139361/1/xu21j_interspeech.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"     In:  Proceedings of the Annual Conference of the International Speech Communication Association: INTERSPEECH 2021.  (pp. pp. 3191-3195).  ISCA: Brno, Czechia. (2021)     ","raw_type":"Proceedings paper"},"sustainable_development_goals":[{"score":0.7099999785423279,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1297994486","display_name":null,"funder_award_id":"RPG-2019-241","funder_id":"https://openalex.org/F4320319993","funder_display_name":"Leverhulme Trust"}],"funders":[{"id":"https://openalex.org/F4320319993","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3196942063.pdf","grobid_xml":"https://content.openalex.org/works/W3196942063.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W34090632","https://openalex.org/W46188241","https://openalex.org/W51888096","https://openalex.org/W1965378753","https://openalex.org/W1975752122","https://openalex.org/W1976587578","https://openalex.org/W1978396169","https://openalex.org/W1981258758","https://openalex.org/W1986221083","https://openalex.org/W1991482046","https://openalex.org/W2001312679","https://openalex.org/W2006775235","https://openalex.org/W2024060531","https://openalex.org/W2057417891","https://openalex.org/W2123778414","https://openalex.org/W2150290224","https://openalex.org/W2153533342","https://openalex.org/W2765553634","https://openalex.org/W2793593753","https://openalex.org/W2999126891","https://openalex.org/W3095560934","https://openalex.org/W4233131682","https://openalex.org/W4245923654","https://openalex.org/W4250530039"],"related_works":["https://openalex.org/W4238901050","https://openalex.org/W2027410645","https://openalex.org/W2065525630","https://openalex.org/W2746534923","https://openalex.org/W2004830549","https://openalex.org/W2090246781","https://openalex.org/W2025869674","https://openalex.org/W1974239872","https://openalex.org/W2272271754","https://openalex.org/W2153533342"],"abstract_inverted_index":{"While":[0],"the":[1,16,36,39,43,97,119,127,134],"acoustic":[2,121],"vowel":[3],"space":[4,19,53],"has":[5],"been":[6],"extensively":[7],"studied":[8],"in":[9],"previous":[10],"research,":[11],"little":[12],"is":[13,109],"known":[14],"about":[15],"high-dimensional":[17],"articulatory":[18,23,52,59,81,101,114],"of":[20,38,113,129],"vowels.":[21,66],"The":[22,83],"imaging":[24],"techniques":[25],"are":[26,96],"limited":[27],"to":[28,48,61,72,132],"tracking":[29],"only":[30],"a":[31,50,57,110],"few":[32],"key":[33],"articulators,":[34],"leaving":[35],"rest":[37],"articulators":[40],"unmonitored.":[41],"In":[42],"present":[44],"study,":[45],"we":[46],"attempted":[47],"develop":[49],"detailed":[51],"obtained":[54],"by":[55],"training":[56],"3D":[58],"synthesizer":[60],"learn":[62],"eleven":[63],"British":[64],"English":[65],"An":[67],"analysis-by-synthesis":[68],"strategy":[69],"was":[70],"used":[71],"acoustically":[73],"optimize":[74],"vocal":[75],"tract":[76],"parameters":[77],"that":[78,86],"represent":[79],"twenty":[80],"dimensions.":[82,102],"results":[84],"show":[85],"tongue":[87],"height":[88],"and":[89,93,139],"retraction,":[90],"larynx":[91],"location":[92],"lip":[94],"roundness":[95],"most":[98],"perceptually":[99],"distinctive":[100],"Yet,":[103],"even":[104],"for":[105],"these":[106],"dimensions,":[107],"there":[108],"fair":[111],"amount":[112],"overlap":[115],"between":[116,136],"vowels,":[117],"unlike":[118],"fine-grained":[120],"space.":[122],"This":[123],"method":[124],"opens":[125],"up":[126],"possibility":[128],"using":[130],"modelling":[131],"investigate":[133],"link":[135],"speech":[137],"production":[138],"perception.":[140]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
