{"id":"https://openalex.org/W1971596446","doi":"https://doi.org/10.1109/icassp.2013.6639213","title":"Articulatory inversion and synthesis: Towards articulatory-based modification of speech","display_name":"Articulatory inversion and synthesis: Towards articulatory-based modification of speech","publication_year":2013,"publication_date":"2013-05-01","ids":{"openalex":"https://openalex.org/W1971596446","doi":"https://doi.org/10.1109/icassp.2013.6639213","mag":"1971596446"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2013.6639213","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639213","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Sandesh Aryal","orcid":null},"institutions":[{"id":"https://openalex.org/I58152225","display_name":"Texas A&M University at Qatar","ror":"https://ror.org/03vb4dm14","country_code":"QA","type":"education","lineage":["https://openalex.org/I58152225","https://openalex.org/I91045830"]},{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["QA","US"],"is_corresponding":false,"raw_author_name":"Sandesh Aryal","raw_affiliation_strings":["Department of Computer Science and Engineering, Texas A and M University, Qatar","Department of Computer Science and Engineering, Texas A&M University , College Station, TX, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Texas A and M University, Qatar","institution_ids":["https://openalex.org/I58152225"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Texas A&M University , College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062423099","display_name":"Ricardo Guti\u00e9rrez\u2010Osuna","orcid":"https://orcid.org/0000-0003-2817-2085"},"institutions":[{"id":"https://openalex.org/I58152225","display_name":"Texas A&M University at Qatar","ror":"https://ror.org/03vb4dm14","country_code":"QA","type":"education","lineage":["https://openalex.org/I58152225","https://openalex.org/I91045830"]},{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["QA","US"],"is_corresponding":false,"raw_author_name":"Ricardo Gutierrez-Osuna","raw_affiliation_strings":["Department of Computer Science and Engineering, Texas A and M University, Qatar","Department of Computer Science and Engineering, Texas A&M University , College Station, TX, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Texas A and M University, Qatar","institution_ids":["https://openalex.org/I58152225"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Texas A&M University , College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.9648,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.91319374,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"7952","last_page":"7956"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.6400498747825623},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6273418664932251},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6137155294418335},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5524652004241943},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.40336188673973083}],"concepts":[{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.6400498747825623},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6273418664932251},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6137155294418335},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5524652004241943},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.40336188673973083},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C109007969","wikidata":"https://www.wikidata.org/wiki/Q749565","display_name":"Structural basin","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2013.6639213","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639213","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.44999998807907104,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W117449184","https://openalex.org/W190138384","https://openalex.org/W1543471089","https://openalex.org/W1857273500","https://openalex.org/W1926768285","https://openalex.org/W1972620250","https://openalex.org/W1982854652","https://openalex.org/W1986174057","https://openalex.org/W1987297220","https://openalex.org/W2017742648","https://openalex.org/W2023728986","https://openalex.org/W2041110166","https://openalex.org/W2102152293","https://openalex.org/W2120605154","https://openalex.org/W2128446656","https://openalex.org/W2129321698","https://openalex.org/W2135707066","https://openalex.org/W2144602675","https://openalex.org/W2147462851","https://openalex.org/W2168858784","https://openalex.org/W2172028426","https://openalex.org/W2400063444","https://openalex.org/W2984826864","https://openalex.org/W6607831622","https://openalex.org/W6712610176"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2130043461","https://openalex.org/W2530322880","https://openalex.org/W1596801655"],"abstract_inverted_index":{"Certain":[0],"speech":[1,142],"modifications,":[2],"such":[3],"as":[4,88],"changes":[5],"in":[6,16,21,56,144],"foreign/regional":[7],"accents":[8],"or":[9],"articulatory":[10,18,30,57,66,146],"styles,":[11],"are":[12,54],"performed":[13],"more":[14],"effectively":[15],"the":[17,22,44,99,107,138,145],"domain":[19,147],"than":[20],"acoustic":[23],"domain.":[24],"Though":[25],"measuring":[26],"articulators":[27,50,72,84,103,129],"is":[28],"cumbersome,":[29],"parameters":[31],"may":[32],"be":[33],"estimated":[34],"from":[35,52],"acoustics":[36,53],"through":[37,90,148],"inversion.":[38,149],"In":[39],"this":[40,60],"paper,":[41],"we":[42,62],"study":[43],"impact":[45],"on":[46],"synthesis":[47,86,117,133],"quality":[48,118],"when":[49],"predicted":[51,73,102],"used":[55],"synthesis.":[58],"For":[59],"purpose,":[61],"trained":[63],"a":[64],"GMM":[65],"synthesizer":[67,100],"and":[68,94,135],"drove":[69],"it":[70],"with":[71,74,101],"an":[75],"RBF-based":[76],"inversion":[77,113],"model.":[78],"Using":[79],"inverted":[80,128],"instead":[81],"of":[82,109,140],"measured":[83,89,122],"degraded":[85],"quality,":[87,134],"Mel":[91],"cepstral":[92],"distortion":[93],"subjective":[95],"tests.":[96],"However,":[97],"retraining":[98],"not":[104,131],"only":[105],"reversed":[106],"effect":[108],"errors":[110],"introduced":[111],"during":[112],"but":[114],"also":[115],"improved":[116],"relative":[119],"to":[120],"using":[121],"articulators.":[123],"These":[124],"results":[125],"suggest":[126],"that":[127],"do":[130],"compromise":[132],"open":[136],"up":[137],"possibility":[139],"performing":[141],"modification":[143]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
