{"id":"https://openalex.org/W1555870626","doi":"https://doi.org/10.1109/icme.2015.7177437","title":"Sparse nonlinear representation for voice conversion","display_name":"Sparse nonlinear representation for voice conversion","publication_year":2015,"publication_date":"2015-06-01","ids":{"openalex":"https://openalex.org/W1555870626","doi":"https://doi.org/10.1109/icme.2015.7177437","mag":"1555870626"},"language":"en","primary_location":{"id":"doi:10.1109/icme.2015.7177437","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme.2015.7177437","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041887072","display_name":"Toru Nakashika","orcid":"https://orcid.org/0000-0003-1863-6771"},"institutions":[{"id":"https://openalex.org/I20529979","display_name":"University of Electro-Communications","ror":"https://ror.org/02x73b849","country_code":"JP","type":"education","lineage":["https://openalex.org/I20529979"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Toru Nakashika","raw_affiliation_strings":["University of Electro-Communications, Graduate School of Information Systems, Tokyo, Japan","University of Electro-Communications, Graduate School of Information Systems, 1-5-1 Chofugaoka, Chofu, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"University of Electro-Communications, Graduate School of Information Systems, Tokyo, Japan","institution_ids":["https://openalex.org/I20529979"]},{"raw_affiliation_string":"University of Electro-Communications, Graduate School of Information Systems, 1-5-1 Chofugaoka, Chofu, Tokyo, Japan","institution_ids":["https://openalex.org/I20529979"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009283470","display_name":"Tetsuya Takiguchi","orcid":"https://orcid.org/0000-0001-5005-7679"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsuya Takiguchi","raw_affiliation_strings":["Kobe University, Graduate School of System Informatics, Kobe, Japan","Kobe University, Graduate School of System Informatics, 1-1 Rokkodai, Japan"],"affiliations":[{"raw_affiliation_string":"Kobe University, Graduate School of System Informatics, Kobe, Japan","institution_ids":["https://openalex.org/I65837984"]},{"raw_affiliation_string":"Kobe University, Graduate School of System Informatics, 1-1 Rokkodai, Japan","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040766342","display_name":"Yasuo Ariki","orcid":"https://orcid.org/0000-0003-3473-2026"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yasuo Ariki","raw_affiliation_strings":["Kobe University, Graduate School of System Informatics, Kobe, Japan","Kobe University, Graduate School of System Informatics, 1-1 Rokkodai, Japan"],"affiliations":[{"raw_affiliation_string":"Kobe University, Graduate School of System Informatics, Kobe, Japan","institution_ids":["https://openalex.org/I65837984"]},{"raw_affiliation_string":"Kobe University, Graduate School of System Informatics, 1-1 Rokkodai, Japan","institution_ids":["https://openalex.org/I65837984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5041887072"],"corresponding_institution_ids":["https://openalex.org/I20529979"],"apc_list":null,"apc_paid":null,"fwci":0.8629,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.81350779,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.8241778612136841},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7509913444519043},{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.5689406991004944},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5651501417160034},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.562558114528656},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5409212708473206},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4921998083591461},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.4806055724620819},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47697529196739197},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.44683459401130676},{"id":"https://openalex.org/keywords/matching-pursuit","display_name":"Matching pursuit","score":0.440584659576416},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.44030192494392395},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3448994755744934},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.3183235228061676},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.13237252831459045}],"concepts":[{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.8241778612136841},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7509913444519043},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.5689406991004944},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5651501417160034},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.562558114528656},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5409212708473206},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4921998083591461},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.4806055724620819},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47697529196739197},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.44683459401130676},{"id":"https://openalex.org/C156872377","wikidata":"https://www.wikidata.org/wiki/Q6786281","display_name":"Matching pursuit","level":3,"score":0.440584659576416},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.44030192494392395},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3448994755744934},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.3183235228061676},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.13237252831459045},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C124851039","wikidata":"https://www.wikidata.org/wiki/Q2665459","display_name":"Compressed sensing","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme.2015.7177437","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme.2015.7177437","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6000000238418579,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W10800834","https://openalex.org/W17772838","https://openalex.org/W49412823","https://openalex.org/W1517766716","https://openalex.org/W1950777589","https://openalex.org/W1963778986","https://openalex.org/W1965255698","https://openalex.org/W1972420736","https://openalex.org/W1993882792","https://openalex.org/W2017425464","https://openalex.org/W2020024436","https://openalex.org/W2022125261","https://openalex.org/W2105160541","https://openalex.org/W2118963448","https://openalex.org/W2120605154","https://openalex.org/W2123003832","https://openalex.org/W2126143605","https://openalex.org/W2131062138","https://openalex.org/W2133257461","https://openalex.org/W2135029798","https://openalex.org/W2136922672","https://openalex.org/W2136936677","https://openalex.org/W2139671364","https://openalex.org/W2156142001","https://openalex.org/W2158164339","https://openalex.org/W2161893161","https://openalex.org/W2165225968","https://openalex.org/W2294351487","https://openalex.org/W2296422624","https://openalex.org/W2296616510","https://openalex.org/W2398524192","https://openalex.org/W2401544731","https://openalex.org/W2401967023","https://openalex.org/W2407110532","https://openalex.org/W2577350056","https://openalex.org/W2913399920","https://openalex.org/W4244017338","https://openalex.org/W4250955649","https://openalex.org/W6631184128","https://openalex.org/W6679486525","https://openalex.org/W6679718588","https://openalex.org/W6680012447","https://openalex.org/W6680066585","https://openalex.org/W6683128514","https://openalex.org/W6683819664","https://openalex.org/W6697695168","https://openalex.org/W6732045268"],"related_works":["https://openalex.org/W2011611369","https://openalex.org/W4297791310","https://openalex.org/W4245251483","https://openalex.org/W1998873033","https://openalex.org/W2116148865","https://openalex.org/W4372266926","https://openalex.org/W2366556501","https://openalex.org/W2965458591","https://openalex.org/W1520740474","https://openalex.org/W4254934694"],"abstract_inverted_index":{"In":[0,22,98],"voice":[1,25,61],"conversion,":[2],"sparse-representation-based":[3,60],"methods":[4,63],"have":[5],"recently":[6],"been":[7],"garnering":[8],"attention":[9],"because":[10],"they":[11],"are,":[12],"relatively":[13],"speaking,":[14],"not":[15],"affected":[16],"by":[17,29],"over-fitting":[18],"or":[19],"over-smoothing":[20],"problems.":[21],"these":[23],"approaches,":[24],"conversion":[26,62],"is":[27,149],"achieved":[28],"estimating":[30],"a":[31,113,142],"sparse":[32,119,152],"vector":[33,52],"that":[34,74,90],"determines":[35],"which":[36,148],"dictionaries":[37,54,93,111],"of":[38,49,55,128],"the":[39,47,50,56,80,95,103,109,126,134],"target":[40],"speaker":[41],"should":[42],"be":[43,65],"used,":[44],"calculated":[45],"from":[46,94],"matching":[48],"input":[51],"and":[53,86,106,141],"source":[57],"speaker.":[58],"The":[59],"can":[64],"broadly":[66],"divided":[67],"into":[68],"two":[69],"approaches:":[70],"1)":[71],"an":[72,88],"approach":[73,89,105],"uses":[75],"raw":[76],"acoustic":[77],"features":[78],"in":[79],"training":[81,96],"data":[82],"as":[83],"parallel":[84,92,110],"dictionaries,":[85],"2)":[87],"trains":[91],"data.":[97],"our":[99,129],"approach,":[100,140,147],"we":[101,124],"follow":[102],"latter":[104],"systematically":[107],"estimate":[108],"using":[112],"joint-density":[114],"restricted":[115],"Boltzmann":[116],"machine":[117],"with":[118,133],"constraints.":[120],"Through":[121],"voice-conversion":[122],"experiments,":[123],"confirmed":[125],"high-performance":[127],"method,":[130],"comparing":[131],"it":[132],"conventional":[135],"Gaussian":[136],"mixture":[137],"model":[138],"(GMM)-based":[139],"non-negative":[143],"matrix":[144],"factorization":[145],"(NMF)-based":[146],"based":[150],"on":[151],"representation.":[153]},"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
