{"id":"https://openalex.org/W2130362963","doi":"https://doi.org/10.1109/icassp.2008.4518697","title":"On combining statistical methods and frequency warping for high-quality voice conversion","display_name":"On combining statistical methods and frequency warping for high-quality voice conversion","publication_year":2008,"publication_date":"2008-03-01","ids":{"openalex":"https://openalex.org/W2130362963","doi":"https://doi.org/10.1109/icassp.2008.4518697","mag":"2130362963"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2008.4518697","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2008.4518697","pdf_url":null,"source":{"id":"https://openalex.org/S4210167542","display_name":"Proceedings of the ... IEEE International Conference on Acoustics, Speech, and Signal Processing","issn_l":"1520-6149","issn":["1520-6149","2379-190X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039550354","display_name":"Daniel Erro","orcid":null},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]},{"id":"https://openalex.org/I71999127","display_name":"Universitat de Barcelona","ror":"https://ror.org/021018s57","country_code":"ES","type":"education","lineage":["https://openalex.org/I71999127"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Daniel Erro","raw_affiliation_strings":["TALP Research Center, Universitat Polilt\u00e8cnica de Catalunya, Spain","TALP Res. Center, Politec. de Catalunya Univ., Barcelona"],"affiliations":[{"raw_affiliation_string":"TALP Research Center, Universitat Polilt\u00e8cnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]},{"raw_affiliation_string":"TALP Res. Center, Politec. de Catalunya Univ., Barcelona","institution_ids":["https://openalex.org/I71999127"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113462087","display_name":"Tatyana Poly\u00e1kova","orcid":null},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]},{"id":"https://openalex.org/I71999127","display_name":"Universitat de Barcelona","ror":"https://ror.org/021018s57","country_code":"ES","type":"education","lineage":["https://openalex.org/I71999127"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Tatyana Polyakova","raw_affiliation_strings":["TALP Research Center, Universitat Polilt\u00e8cnica de Catalunya, Spain","TALP Res. Center, Politec. de Catalunya Univ., Barcelona"],"affiliations":[{"raw_affiliation_string":"TALP Research Center, Universitat Polilt\u00e8cnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]},{"raw_affiliation_string":"TALP Res. Center, Politec. de Catalunya Univ., Barcelona","institution_ids":["https://openalex.org/I71999127"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103681962","display_name":"Asunci\u00f3n Moreno","orcid":null},"institutions":[{"id":"https://openalex.org/I71999127","display_name":"Universitat de Barcelona","ror":"https://ror.org/021018s57","country_code":"ES","type":"education","lineage":["https://openalex.org/I71999127"]},{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Asuncion Moreno","raw_affiliation_strings":["TALP Research Center, Universitat Polilt\u00e8cnica de Catalunya, Spain","TALP Res. Center, Politec. de Catalunya Univ., Barcelona"],"affiliations":[{"raw_affiliation_string":"TALP Research Center, Universitat Polilt\u00e8cnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]},{"raw_affiliation_string":"TALP Res. Center, Politec. de Catalunya Univ., Barcelona","institution_ids":["https://openalex.org/I71999127"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5039550354"],"corresponding_institution_ids":["https://openalex.org/I71999127","https://openalex.org/I9617848"],"apc_list":null,"apc_paid":null,"fwci":2.1043,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.8627685,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"4665","last_page":"4668"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7288208603858948},{"id":"https://openalex.org/keywords/dynamic-time-warping","display_name":"Dynamic time warping","score":0.7243671417236328},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6687105894088745},{"id":"https://openalex.org/keywords/image-warping","display_name":"Image warping","score":0.6673327684402466},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.665519654750824},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6415238976478577},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4873441159725189},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46481001377105713},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4157855808734894},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2317689061164856}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7288208603858948},{"id":"https://openalex.org/C88516994","wikidata":"https://www.wikidata.org/wiki/Q1268863","display_name":"Dynamic time warping","level":2,"score":0.7243671417236328},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6687105894088745},{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.6673327684402466},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.665519654750824},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6415238976478577},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4873441159725189},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46481001377105713},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4157855808734894},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2317689061164856},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2008.4518697","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2008.4518697","pdf_url":null,"source":{"id":"https://openalex.org/S4210167542","display_name":"Proceedings of the ... IEEE International Conference on Acoustics, Speech, and Signal Processing","issn_l":"1520-6149","issn":["1520-6149","2379-190X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W33533989","https://openalex.org/W152891837","https://openalex.org/W155193863","https://openalex.org/W1533098358","https://openalex.org/W1963778986","https://openalex.org/W2067234399","https://openalex.org/W2105698384","https://openalex.org/W2118850452","https://openalex.org/W2121387787","https://openalex.org/W2127167788","https://openalex.org/W2136166660","https://openalex.org/W2145130307","https://openalex.org/W2156142001","https://openalex.org/W2244925781","https://openalex.org/W2294205684","https://openalex.org/W2403171680","https://openalex.org/W6601370681","https://openalex.org/W6713031523","https://openalex.org/W6902064130"],"related_works":["https://openalex.org/W1670332068","https://openalex.org/W2095618524","https://openalex.org/W2735770592","https://openalex.org/W1971024059","https://openalex.org/W2347413598","https://openalex.org/W2330863229","https://openalex.org/W71572444","https://openalex.org/W1997383766","https://openalex.org/W2350336482","https://openalex.org/W2340348677"],"abstract_inverted_index":{"In":[0,63,93],"current":[1],"voice":[2,60,118],"conversion":[3,61],"systems,":[4,87],"obtaining":[5],"a":[6,15,43,58,81],"high":[7,16],"similarity":[8,50],"between":[9,48],"converted":[10],"and":[11,52,72,134],"target":[12],"voices":[13],"requires":[14],"degree":[17],"of":[18,99],"signal":[19],"manipulation,":[20],"which":[21],"implies":[22],"important":[23],"quality":[24,35,54,91],"degradation,":[25],"up":[26],"to":[27,79,89,111],"the":[28,34,49,53,113,125,130,141],"point":[29],"that":[30,69,140],"in":[31,109],"some":[32],"cases":[33],"scores":[36,51,55],"are":[37,104],"unacceptable":[38],"for":[39,116],"real-life":[40],"applications.":[41],"Indeed,":[42],"tradeoff":[44],"can":[45],"be":[46,77],"observed":[47],"achieved":[56],"by":[57,148],"given":[59],"system.":[62],"our":[64],"previous":[65],"works":[66],"we":[67],"proved":[68],"statistical":[70],"methods":[71],"frequency":[73],"warping":[74],"transformations":[75],"could":[76],"combined":[78],"yield":[80],"better":[82],"similarity-quality":[83],"balance":[84],"than":[85],"conventional":[86],"due":[88],"significant":[90],"improvements.":[92],"this":[94],"paper,":[95],"two":[96,102],"different":[97],"ways":[98],"combining":[100],"these":[101],"approaches":[103],"compared":[105],"through":[106],"perceptual":[107],"tests":[108],"order":[110],"determine":[112],"best":[114],"strategy":[115],"high-quality":[117],"conversion.":[119],"The":[120,137],"comparison":[121],"is":[122,146],"made":[123],"under":[124],"same":[126,131],"training":[127],"conditions,":[128],"using":[129],"speech":[132],"model":[133],"vector":[135],"dimensions.":[136],"results":[138],"indicate":[139],"Weighted":[142],"Frequency":[143],"Warping":[144],"method":[145],"preferred":[147],"listeners.":[149]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
