{"id":"https://openalex.org/W2775672830","doi":"https://doi.org/10.1109/waspaa.2017.8170049","title":"Voice conversion based on a mixture density network","display_name":"Voice conversion based on a mixture density network","publication_year":2017,"publication_date":"2017-10-01","ids":{"openalex":"https://openalex.org/W2775672830","doi":"https://doi.org/10.1109/waspaa.2017.8170049","mag":"2775672830"},"language":"en","primary_location":{"id":"doi:10.1109/waspaa.2017.8170049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa.2017.8170049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017220021","display_name":"Mohsen Ahangar","orcid":null},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mohsen Ahangar","raw_affiliation_strings":["School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056598606","display_name":"Mostafa Ghorbandoost","orcid":null},"institutions":[{"id":"https://openalex.org/I158248296","display_name":"Amirkabir University of Technology","ror":"https://ror.org/04gzbav43","country_code":"IR","type":"education","lineage":["https://openalex.org/I158248296"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Mostafa Ghorbandoost","raw_affiliation_strings":["School of Electrical Engineering, Amirkabir University of Technology, Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Amirkabir University of Technology, Tehran, Iran","institution_ids":["https://openalex.org/I158248296"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068330021","display_name":"Sudhendu Raj Sharma","orcid":"https://orcid.org/0000-0003-1996-673X"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sudhendu Sharma","raw_affiliation_strings":["School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103578281","display_name":"M.J.T. Smith","orcid":null},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark J. T. Smith","raw_affiliation_strings":["School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5017220021"],"corresponding_institution_ids":["https://openalex.org/I219193219"],"apc_list":null,"apc_paid":null,"fwci":0.9751,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.82789231,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"128","issue":null,"first_page":"329","last_page":"333"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.8813139796257019},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6237677335739136},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6023896336555481},{"id":"https://openalex.org/keywords/expectation\u2013maximization-algorithm","display_name":"Expectation\u2013maximization algorithm","score":0.5406839847564697},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5253122448921204},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.49930667877197266},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.47828277945518494},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4697715938091278},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.4645023047924042},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4592594504356384},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44665804505348206},{"id":"https://openalex.org/keywords/mixture-distribution","display_name":"Mixture distribution","score":0.4295696020126343},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4114045798778534},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.381011962890625},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2503824234008789},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.23389378190040588},{"id":"https://openalex.org/keywords/probability-density-function","display_name":"Probability density function","score":0.18374192714691162},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.14511099457740784},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06804093718528748},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.06571197509765625}],"concepts":[{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.8813139796257019},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6237677335739136},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6023896336555481},{"id":"https://openalex.org/C182081679","wikidata":"https://www.wikidata.org/wiki/Q1275153","display_name":"Expectation\u2013maximization algorithm","level":3,"score":0.5406839847564697},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5253122448921204},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.49930667877197266},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.47828277945518494},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4697715938091278},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.4645023047924042},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4592594504356384},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44665804505348206},{"id":"https://openalex.org/C56672385","wikidata":"https://www.wikidata.org/wiki/Q17157111","display_name":"Mixture distribution","level":3,"score":0.4295696020126343},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4114045798778534},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.381011962890625},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2503824234008789},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.23389378190040588},{"id":"https://openalex.org/C197055811","wikidata":"https://www.wikidata.org/wiki/Q207522","display_name":"Probability density function","level":2,"score":0.18374192714691162},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.14511099457740784},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06804093718528748},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.06571197509765625},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C147597530","wikidata":"https://www.wikidata.org/wiki/Q369472","display_name":"Computational chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/waspaa.2017.8170049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa.2017.8170049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1579853615","https://openalex.org/W1601795611","https://openalex.org/W1663973292","https://openalex.org/W1968689546","https://openalex.org/W1981556389","https://openalex.org/W1982854652","https://openalex.org/W2018932587","https://openalex.org/W2049686551","https://openalex.org/W2116257577","https://openalex.org/W2120605154","https://openalex.org/W2123003832","https://openalex.org/W2126143605","https://openalex.org/W2128466129","https://openalex.org/W2139627492","https://openalex.org/W2296704011","https://openalex.org/W3143522270","https://openalex.org/W3177989406","https://openalex.org/W6629510986","https://openalex.org/W6634817459","https://openalex.org/W6697285287","https://openalex.org/W6798679566"],"related_works":["https://openalex.org/W2198732287","https://openalex.org/W4287816759","https://openalex.org/W2803473765","https://openalex.org/W2372918136","https://openalex.org/W2153481672","https://openalex.org/W2105786884","https://openalex.org/W2128540811","https://openalex.org/W1658960529","https://openalex.org/W4293056332","https://openalex.org/W4312864369"],"abstract_inverted_index":{"This":[0,52],"paper":[1],"presents":[2],"a":[3,11,21,86],"new":[4],"voice":[5],"conversion":[6],"(VC)":[7],"algorithm":[8],"based":[9],"on":[10],"Mixture":[12,23],"Density":[13,107],"Network":[14,30],"(MDN).":[15],"MDN":[16,56,74,80,100],"is":[17],"the":[18,33,36,42,47,55,68,73,79,98,115,119],"combination":[19],"of":[20,35,46,125],"Gaussian":[22],"Model":[24],"(GMM)":[25],"and":[26,105,121,128],"an":[27],"Artificial":[28],"Neural":[29],"(ANN),":[31],"where":[32],"parameters":[34,59],"GMM":[37,58,108],"are":[38],"estimated":[39],"by":[40],"using":[41],"ANN":[43],"method":[44,101,117],"instead":[45],"Expectation":[48],"Maximization":[49],"(EM)":[50],"algorithm.":[51],"characteristic":[53],"helps":[54],"estimate":[57],"more":[60],"accurately,":[61],"which":[62],"results":[63,93],"in":[64,67,123],"lower":[65],"distortion":[66],"converted":[69],"speech.":[70],"To":[71],"apply":[72],"to":[75],"VC,":[76],"we":[77],"combine":[78],"with":[81,103],"Maximum":[82],"Likelihood":[83],"Estimation,":[84],"employing":[85],"Global":[87],"Variance":[88],"modification":[89],"(MLE-GV)":[90],"method.":[91],"Objective":[92],"show":[94],"better":[95],"performance":[96],"for":[97],"proposed":[99,116],"compared":[102],"MLE":[104],"Joint":[106],"(JDGMM)":[109],"methods.":[110],"Subjective":[111],"experiments":[112],"demonstrate":[113],"that":[114],"outperforms":[118],"MLE-GV":[120],"JDGMM-GV":[122],"terms":[124],"speech":[126],"quality":[127],"speaker":[129],"individuality.":[130]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
