{"id":"https://openalex.org/W2733416080","doi":"https://doi.org/10.1109/taslp.2017.2723721","title":"An Exemplar-Based Approach to Frequency Warping for Voice Conversion","display_name":"An Exemplar-Based Approach to Frequency Warping for Voice Conversion","publication_year":2017,"publication_date":"2017-07-05","ids":{"openalex":"https://openalex.org/W2733416080","doi":"https://doi.org/10.1109/taslp.2017.2723721","mag":"2733416080"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2017.2723721","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2017.2723721","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103156833","display_name":"Xiaohai Tian","orcid":"https://orcid.org/0000-0001-5219-1249"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Xiaohai Tian","raw_affiliation_strings":["School of Computer Science and Engineering, Joint NTU-UBC Research Centre of Excellence in Active Living for the Elderly, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Joint NTU-UBC Research Centre of Excellence in Active Living for the Elderly, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049491887","display_name":"Siu Wa Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Siu Wa Lee","raw_affiliation_strings":["Institute for Infocomm Research, A*STAR, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, A*STAR, Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102765381","display_name":"Zhizheng Wu","orcid":"https://orcid.org/0009-0001-1192-9857"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhizheng Wu","raw_affiliation_strings":["Center for Speech Technology Research, University of Edinburgh, Edinburgh, U.K"],"affiliations":[{"raw_affiliation_string":"Center for Speech Technology Research, University of Edinburgh, Edinburgh, U.K","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070872826","display_name":"Eng Siong Chng","orcid":"https://orcid.org/0000-0001-6257-7399"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Eng Siong Chng","raw_affiliation_strings":["School of Computer Science and Engineering, Joint NTU-UBC Research Centre of Excellence in Active Living for the Elderly, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Joint NTU-UBC Research Centre of Excellence in Active Living for the Elderly, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":"https://orcid.org/0000-0001-9158-9401"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103156833"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":5.4607,"has_fulltext":true,"cited_by_count":47,"citation_normalized_percentile":{"value":0.96572029,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"25","issue":"10","first_page":"1863","last_page":"1876"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image-warping","display_name":"Image warping","score":0.8335701823234558},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7561630010604858},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7150148749351501},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.5045591592788696},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.43976402282714844},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42836907505989075},{"id":"https://openalex.org/keywords/dynamic-time-warping","display_name":"Dynamic time warping","score":0.41321098804473877},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37951964139938354},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32487744092941284},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1470622420310974}],"concepts":[{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.8335701823234558},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7561630010604858},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7150148749351501},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.5045591592788696},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.43976402282714844},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42836907505989075},{"id":"https://openalex.org/C88516994","wikidata":"https://www.wikidata.org/wiki/Q1268863","display_name":"Dynamic time warping","level":2,"score":0.41321098804473877},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37951964139938354},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32487744092941284},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1470622420310974},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2017.2723721","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2017.2723721","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/89630","is_oa":false,"landing_page_url":"http://hdl.handle.net/10220/47103","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"},{"id":"https://openalex.org/F4320320751","display_name":"Ministry of Education - Singapore","ror":"https://ror.org/01kcva023"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W49412823","https://openalex.org/W1497120562","https://openalex.org/W1524403222","https://openalex.org/W1536047166","https://openalex.org/W1539053441","https://openalex.org/W1588266896","https://openalex.org/W1599112982","https://openalex.org/W1963778986","https://openalex.org/W1972420736","https://openalex.org/W1977362459","https://openalex.org/W1999517677","https://openalex.org/W2005438552","https://openalex.org/W2009272428","https://openalex.org/W2017425464","https://openalex.org/W2020834817","https://openalex.org/W2049686551","https://openalex.org/W2055912867","https://openalex.org/W2060554399","https://openalex.org/W2072503712","https://openalex.org/W2086796102","https://openalex.org/W2105160541","https://openalex.org/W2110118271","https://openalex.org/W2110589840","https://openalex.org/W2111550316","https://openalex.org/W2120605154","https://openalex.org/W2120858595","https://openalex.org/W2121387787","https://openalex.org/W2123003832","https://openalex.org/W2126143605","https://openalex.org/W2128160875","https://openalex.org/W2135029798","https://openalex.org/W2136166660","https://openalex.org/W2141520175","https://openalex.org/W2143116775","https://openalex.org/W2150415460","https://openalex.org/W2153425803","https://openalex.org/W2156142001","https://openalex.org/W2156477760","https://openalex.org/W2160473997","https://openalex.org/W2165674530","https://openalex.org/W2169652224","https://openalex.org/W2177286092","https://openalex.org/W2179428711","https://openalex.org/W2244925781","https://openalex.org/W2292984643","https://openalex.org/W2294038178","https://openalex.org/W2294246205","https://openalex.org/W2402356521","https://openalex.org/W2406654659","https://openalex.org/W2408732577","https://openalex.org/W2475998840","https://openalex.org/W2577042574","https://openalex.org/W3124274650","https://openalex.org/W3143596294","https://openalex.org/W6602007935","https://openalex.org/W6632201099","https://openalex.org/W6635216677","https://openalex.org/W6635678660","https://openalex.org/W6676465519","https://openalex.org/W6680012447","https://openalex.org/W6697024540","https://openalex.org/W6697270646","https://openalex.org/W6732251480","https://openalex.org/W6902064130"],"related_works":["https://openalex.org/W1670332068","https://openalex.org/W2095618524","https://openalex.org/W2735770592","https://openalex.org/W2347413598","https://openalex.org/W2330863229","https://openalex.org/W71572444","https://openalex.org/W1997383766","https://openalex.org/W2350336482","https://openalex.org/W2340348677","https://openalex.org/W2130799169"],"abstract_inverted_index":{"The":[0,77],"voice":[1,10,42,55,151],"conversion's":[2],"task":[3],"is":[4,22,80,98],"to":[5,11,33,73],"modify":[6],"a":[7,16,40,83,87,102,156],"source":[8],"speaker's":[9],"sound":[12],"like":[13],"that":[14],"of":[15,89,106,148],"target":[17,35],"speaker.":[18,36],"A":[19],"conversion":[20,43,63,125,134,152],"method":[21,53,58],"considered":[23],"successful":[24],"when":[25],"the":[26,34,70,75,94,112,124,133,142,146,149,163],"produced":[27],"speech":[28,160],"sounds":[29],"natural":[30],"and":[31,51,138],"similar":[32],"This":[37],"paper":[38],"presents":[39],"new":[41],"framework":[44],"in":[45,159],"which":[46],"we":[47,108,127],"combine":[48],"frequency":[49,67],"warping":[50,68,78,91,96],"exemplar-based":[52],"for":[54,123],"conversion.":[56],"Our":[57],"maintains":[59],"high-resolution":[60,71],"details":[61],"during":[62],"by":[64,82],"directly":[65],"applying":[66],"on":[69,101,141],"spectrum":[72],"represent":[74],"target.":[76],"function":[79,97],"generated":[81,95],"sparse":[84],"interpolation":[85],"from":[86,117],"dictionary":[88],"exemplar":[90],"functions.":[92],"As":[93],"dependent":[99],"only":[100],"very":[103],"small":[104],"set":[105],"exemplars,":[107],"do":[109],"away":[110],"with":[111],"statistical":[113],"averaging":[114],"effects":[115],"inherited":[116],"Gaussian":[118],"mixture":[119],"models.":[120],"To":[121],"compensate":[122],"error,":[126],"also":[128],"apply":[129],"residual":[130],"exemplars":[131],"into":[132],"process.":[135],"Both":[136],"objective":[137],"subjective":[139],"evaluations":[140],"VOICES":[143],"database":[144],"validated":[145],"effectiveness":[147],"proposed":[150],"framework.":[153],"We":[154],"observed":[155],"significant":[157],"improvement":[158],"quality":[161],"over":[162],"state-of-the-art":[164],"parametric":[165],"methods.":[166]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":13},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
