{"id":"https://openalex.org/W2032700328","doi":"https://doi.org/10.1109/iscslp.2014.6936610","title":"Frame correlation based autoregressive GMM method for voice conversion","display_name":"Frame correlation based autoregressive GMM method for voice conversion","publication_year":2014,"publication_date":"2014-09-01","ids":{"openalex":"https://openalex.org/W2032700328","doi":"https://doi.org/10.1109/iscslp.2014.6936610","mag":"2032700328"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2014.6936610","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2014.6936610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 9th International Symposium on Chinese Spoken Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100425999","display_name":"Xian Li","orcid":"https://orcid.org/0000-0001-5714-3940"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xian Li","raw_affiliation_strings":["Dept. of Automation, University of Science and Technology of China, Hefei","National Engineering Laboratory of Speech and Language Information Processing, Hefei"],"affiliations":[{"raw_affiliation_string":"Dept. of Automation, University of Science and Technology of China, Hefei","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"National Engineering Laboratory of Speech and Language Information Processing, Hefei","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103123751","display_name":"Zengfu Wang","orcid":"https://orcid.org/0000-0003-1859-900X"},"institutions":[{"id":"https://openalex.org/I4210099079","display_name":"Institute of Intelligent Machines","ror":"https://ror.org/00w0qep84","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I2802624667","https://openalex.org/I4210099079"]},{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zeng-fu Wang","raw_affiliation_strings":["Chinese Academy of Sciences, Institute of Intelligent Machines, Hefei","Dept. of Automation, University of Science and Technology of China, Hefei","National Engineering Laboratory of Speech and Language Information Processing, Hefei"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Institute of Intelligent Machines, Hefei","institution_ids":["https://openalex.org/I4210099079"]},{"raw_affiliation_string":"Dept. of Automation, University of Science and Technology of China, Hefei","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"National Engineering Laboratory of Speech and Language Information Processing, Hefei","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100425999"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.409,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.73674556,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"221","last_page":"225"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.8271461129188538},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.6771897077560425},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6299878358840942},{"id":"https://openalex.org/keywords/correlation","display_name":"Correlation","score":0.6061854362487793},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5712724328041077},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.5432189702987671},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4896250367164612},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4783608317375183},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4642534852027893},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2265365719795227},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.14615580439567566}],"concepts":[{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.8271461129188538},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.6771897077560425},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6299878358840942},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.6061854362487793},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5712724328041077},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.5432189702987671},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4896250367164612},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4783608317375183},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4642534852027893},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2265365719795227},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.14615580439567566},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp.2014.6936610","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2014.6936610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 9th International Symposium on Chinese Spoken Language Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W95152782","https://openalex.org/W1491561031","https://openalex.org/W1973685422","https://openalex.org/W2005438552","https://openalex.org/W2024083195","https://openalex.org/W2049633694","https://openalex.org/W2116257577","https://openalex.org/W2120605154","https://openalex.org/W2123003832","https://openalex.org/W2131062138","https://openalex.org/W2143029619","https://openalex.org/W2156142001","https://openalex.org/W2943553228","https://openalex.org/W3129711340","https://openalex.org/W6603838645","https://openalex.org/W6681422213"],"related_works":["https://openalex.org/W2171218219","https://openalex.org/W1972271943","https://openalex.org/W2150410159","https://openalex.org/W4327525404","https://openalex.org/W4287185323","https://openalex.org/W3150905897","https://openalex.org/W1520183331","https://openalex.org/W2734842993","https://openalex.org/W2168175994","https://openalex.org/W2049473509"],"abstract_inverted_index":{"In":[0,15],"this":[1],"paper,":[2],"we":[3],"present":[4],"a":[5,55,69,76],"frame":[6,79],"correlation":[7,20,34,95],"based":[8],"autoregressive":[9,41],"GMM":[10],"method":[11,83,107],"for":[12,50,148],"voice":[13],"conversion.":[14],"our":[16],"system,":[17],"the":[18,22,32,51,66,73,105,121,129,139],"cross-frame":[19,33,94],"of":[21,35,68,75,116,133],"source":[23,70],"feature":[24,37,67],"is":[25,38,48,61,84,118,144],"modeled":[26,39],"with":[27,124],"augmented":[28],"delta":[29],"features,":[30],"and":[31,54,88,128],"target":[36,77,92],"by":[40,80,90],"models.":[42],"The":[43,100,111],"expectation":[44],"maximization":[45],"(EM)":[46],"algorithm":[47,60],"used":[49],"model":[52],"training,":[53],"maximum":[56],"likelihood":[57],"parameter":[58],"conversion":[59,89],"then":[62],"employed":[63],"to":[64,138],"convert":[65],"speaker":[71,78],"into":[72],"one":[74],"frame.":[81],"This":[82],"consistent":[85],"in":[86],"training":[87],"using":[91],"feature's":[93],"explicitly":[96],"at":[97],"both":[98],"stage.":[99],"experimental":[101],"results":[102,132],"show":[103],"that":[104],"proposed":[106],"has":[108],"excellent":[109],"performance.":[110],"test":[112],"set":[113],"log":[114],"probability":[115],"it":[117,134,143],"higher":[119],"than":[120],"GMM-DYN":[122,140],"(GMM":[123],"dynamic":[125],"features)":[126],"method,":[127],"subjective":[130],"evaluation":[131],"are":[135],"also":[136],"comparable":[137],"method.":[141],"Furthermore,":[142],"much":[145],"more":[146],"suitable":[147],"low-latency":[149],"application.":[150]},"counts_by_year":[{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
