{"id":"https://openalex.org/W2995021324","doi":"https://doi.org/10.1145/3368926.3369662","title":"Emotional Speech Generator by using Generative Adversarial Networks","display_name":"Emotional Speech Generator by using Generative Adversarial Networks","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2995021324","doi":"https://doi.org/10.1145/3368926.3369662","mag":"2995021324"},"language":"en","primary_location":{"id":"doi:10.1145/3368926.3369662","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3368926.3369662","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Tenth International Symposium on Information and Communication Technology  - SoICT 2019","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040327114","display_name":"Takuya Asakura","orcid":null},"institutions":[{"id":"https://openalex.org/I52706244","display_name":"College of Industrial Technology","ror":"https://ror.org/054a9s036","country_code":"JP","type":"education","lineage":["https://openalex.org/I52706244"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Takuya Asakura","raw_affiliation_strings":["Advanced course of Electronics, Tokyo Metropolitan College of Industrial Technology, Arakawa-ward, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Advanced course of Electronics, Tokyo Metropolitan College of Industrial Technology, Arakawa-ward, Tokyo, Japan","institution_ids":["https://openalex.org/I52706244"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006007483","display_name":"Shunsuke Akama","orcid":null},"institutions":[{"id":"https://openalex.org/I52706244","display_name":"College of Industrial Technology","ror":"https://ror.org/054a9s036","country_code":"JP","type":"education","lineage":["https://openalex.org/I52706244"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shunsuke Akama","raw_affiliation_strings":["Advanced course of Electronics Tokyo Metropolitan College of Industrial Technology Arakawa-ward, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Advanced course of Electronics Tokyo Metropolitan College of Industrial Technology Arakawa-ward, Tokyo, Japan","institution_ids":["https://openalex.org/I52706244"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040244392","display_name":"Eri Sato-Shimokawara","orcid":"https://orcid.org/0000-0002-4189-9724"},"institutions":[{"id":"https://openalex.org/I69740276","display_name":"Tokyo Metropolitan University","ror":"https://ror.org/00ws30h19","country_code":"JP","type":"education","lineage":["https://openalex.org/I69740276"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Eri Shimokawara","raw_affiliation_strings":["Graduate school of Information Science, Tokyo Metropolitan University Hino-city, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate school of Information Science, Tokyo Metropolitan University Hino-city, Tokyo, Japan","institution_ids":["https://openalex.org/I69740276"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056005443","display_name":"Toru Yamaguchi","orcid":"https://orcid.org/0000-0002-7183-7209"},"institutions":[{"id":"https://openalex.org/I69740276","display_name":"Tokyo Metropolitan University","ror":"https://ror.org/00ws30h19","country_code":"JP","type":"education","lineage":["https://openalex.org/I69740276"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Toru Yamaguchi","raw_affiliation_strings":["Graduate school of Information Science, Tokyo Metropolitan University Hino-city, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate school of Information Science, Tokyo Metropolitan University Hino-city, Tokyo, Japan","institution_ids":["https://openalex.org/I69740276"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101445428","display_name":"Shoji Yamamoto","orcid":"https://orcid.org/0000-0003-2112-8612"},"institutions":[{"id":"https://openalex.org/I52706244","display_name":"College of Industrial Technology","ror":"https://ror.org/054a9s036","country_code":"JP","type":"education","lineage":["https://openalex.org/I52706244"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shoji Yamamoto","raw_affiliation_strings":["Advanced course of Electronics, Tokyo Metropolitan College of Industrial Technology Arakawa-ward, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Advanced course of Electronics, Tokyo Metropolitan College of Industrial Technology Arakawa-ward, Tokyo, Japan","institution_ids":["https://openalex.org/I52706244"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5040327114"],"corresponding_institution_ids":["https://openalex.org/I52706244"],"apc_list":null,"apc_paid":null,"fwci":0.5027,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.65076266,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"9","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.8236289024353027},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.7302618622779846},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.701364278793335},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6777614951133728},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5075427293777466},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.37744230031967163},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3621801733970642}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.8236289024353027},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.7302618622779846},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.701364278793335},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6777614951133728},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5075427293777466},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37744230031967163},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3621801733970642},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3368926.3369662","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3368926.3369662","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Tenth International Symposium on Information and Communication Technology  - SoICT 2019","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7099999785423279,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2099471712","https://openalex.org/W2123771434","https://openalex.org/W2146334809","https://openalex.org/W2194775991","https://openalex.org/W2471520273","https://openalex.org/W2476548250","https://openalex.org/W2567070169","https://openalex.org/W2603777577","https://openalex.org/W2769810959","https://openalex.org/W2774848319","https://openalex.org/W2777302760","https://openalex.org/W2805669069","https://openalex.org/W2902070858","https://openalex.org/W2951697117","https://openalex.org/W2962793481","https://openalex.org/W2963970792","https://openalex.org/W4250482878","https://openalex.org/W4294619240"],"related_works":["https://openalex.org/W3005996785","https://openalex.org/W3107474891","https://openalex.org/W4289303600","https://openalex.org/W3024390022","https://openalex.org/W4288624664","https://openalex.org/W2476099471","https://openalex.org/W2914998939","https://openalex.org/W3156291593","https://openalex.org/W2561036008","https://openalex.org/W2900055988"],"abstract_inverted_index":{"In":[0,59],"this":[1,60],"paper,":[2],"we":[3,43,84,122],"propose":[4],"an":[5,13,40,67,74,138],"affective":[6],"voice":[7],"conversion":[8],"method":[9,27,158],"that":[10],"can":[11],"generate":[12],"emotional":[14,119,141],"phonation":[15],"from":[16,36],"neutral":[17],"speech":[18,37,117],"by":[19,132],"using":[20,133],"cycle-consistent":[21],"generative":[22],"adversarial":[23],"networks":[24],"(CycleGAN).":[25],"Our":[26],"uses":[28],"the":[29,45,63,80,90,97,100,107,115,124,134,144,152,163,166],"Mel-cepstral":[30],"coefficients":[31],"(MCEPs),":[32],"which":[33,49],"are":[34],"extracted":[35],"signal":[38],"as":[39],"input.":[41],"Next,":[42],"apply":[44],"modified":[46],"network":[47],"model":[48],"is":[50,71,111,148],"comprised":[51],"two":[52,86],"components":[53],"with":[54,66,118],"a":[55,93,103],"generator":[56,61],"and":[57,69,76,99,127],"discriminator.":[58],"network,":[62],"pairing":[64],"structure":[65],"encoder":[68,95,105],"decoder":[70],"used":[72],"for":[73,96,106,137],"accurate":[75],"fast":[77],"calculation":[78],"in":[79],"learning":[81],"process.":[82],"Furthermore,":[83],"construct":[85],"types":[87],"of":[88,130,140,154,165],"encoder;":[89],"one":[91],"equips":[92,102],"content":[94],"linguistic-information,":[98],"other":[101],"domain":[104],"emotional-information.":[108],"This":[109],"separation":[110],"enable":[112],"to":[113,150,161],"reproduce":[114],"smooth":[116],"information.":[120],"Finally,":[121],"evaluate":[123],"emotion":[125,164],"expression":[126],"sound":[128,155],"quality":[129],"speeches":[131],"subjective":[135],"evaluation":[136],"accuracy":[139],"change.":[142],"As":[143],"result,":[145],"although":[146],"it":[147],"necessary":[149],"improve":[151],"deterioration":[153],"quality,":[156],"our":[157],"has":[159],"accomplished":[160],"convert":[162],"speech.":[167]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2025-10-10T00:00:00"}
