{"id":"https://openalex.org/W2715071750","doi":"https://doi.org/10.1142/s021800141860008x","title":"LSTM Deep Neural Networks Postfiltering for Enhancing Synthetic Voices","display_name":"LSTM Deep Neural Networks Postfiltering for Enhancing Synthetic Voices","publication_year":2017,"publication_date":"2017-06-19","ids":{"openalex":"https://openalex.org/W2715071750","doi":"https://doi.org/10.1142/s021800141860008x","mag":"2715071750"},"language":"en","primary_location":{"id":"doi:10.1142/s021800141860008x","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s021800141860008x","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053058951","display_name":"Marvin Coto-Jim\u00e9nez","orcid":"https://orcid.org/0000-0002-6833-9938"},"institutions":[{"id":"https://openalex.org/I200362191","display_name":"Universidad Aut\u00f3noma Metropolitana","ror":"https://ror.org/02kta5139","country_code":"MX","type":"education","lineage":["https://openalex.org/I200362191"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Marvin Coto-Jim\u00e9nez","raw_affiliation_strings":["University of Costa Rica, San Jos\u00e9, Costa Rica and Metropolitan Autonomous University, Mexico D.F"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Costa Rica, San Jos\u00e9, Costa Rica and Metropolitan Autonomous University, Mexico D.F","institution_ids":["https://openalex.org/I200362191"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001627685","display_name":"John Goddard-Close","orcid":null},"institutions":[{"id":"https://openalex.org/I200362191","display_name":"Universidad Aut\u00f3noma Metropolitana","ror":"https://ror.org/02kta5139","country_code":"MX","type":"education","lineage":["https://openalex.org/I200362191"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"John Goddard-Close","raw_affiliation_strings":["Metropolitan Autonomous University, Mexico D.F"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Metropolitan Autonomous University, Mexico D.F","institution_ids":["https://openalex.org/I200362191"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.4784,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.91683513,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"32","issue":"01","first_page":"1860008","last_page":"1860008"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.8568565249443054},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8140063285827637},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6328726410865784},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5962942242622375},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5391533374786377},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5009329319000244},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.495096355676651},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.47787824273109436},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.4608561396598816},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4267333149909973}],"concepts":[{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.8568565249443054},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8140063285827637},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6328726410865784},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5962942242622375},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5391533374786377},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5009329319000244},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.495096355676651},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.47787824273109436},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.4608561396598816},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4267333149909973},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1142/s021800141860008x","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s021800141860008x","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:https://www.kerwa.ucr.ac.cr:10669/86283","is_oa":false,"landing_page_url":"https://www.worldscientific.com/doi/abs/10.1142/S021800141860008X","pdf_url":null,"source":{"id":"https://openalex.org/S4306400069","display_name":"Investigative News in Education (Universidad de Costa Rica)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I198243066","host_organization_name":"Universidad Nacional","host_organization_lineage":["https://openalex.org/I198243066"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence, vol.32(1), pp.1-24.","raw_type":"art\u00edculo cient\u00edfico"},{"id":"pmh:oai:kerwa.ucr.ac.cr:10669/86283","is_oa":false,"landing_page_url":"https://hdl.handle.net/10669/86283","pdf_url":null,"source":{"id":"https://openalex.org/S4306400069","display_name":"Investigative News in Education (Universidad de Costa Rica)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I198243066","host_organization_name":"Universidad Nacional","host_organization_lineage":["https://openalex.org/I198243066"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence, vol.32(1), pp.1-24.","raw_type":"art\u00edculo original"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321739","display_name":"Consejo Nacional de Ciencia y Tecnolog\u00eda","ror":"https://ror.org/059ex5q34"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W304834817","https://openalex.org/W950853366","https://openalex.org/W2036233992","https://openalex.org/W2064675550","https://openalex.org/W2163925746","https://openalex.org/W2332529255","https://openalex.org/W2967570265","https://openalex.org/W4285719527","https://openalex.org/W4300458848"],"related_works":["https://openalex.org/W2136763963","https://openalex.org/W2109705048","https://openalex.org/W2940588515","https://openalex.org/W1521297879","https://openalex.org/W2036150633","https://openalex.org/W3184123547","https://openalex.org/W1909151225","https://openalex.org/W2160030256","https://openalex.org/W2536059291","https://openalex.org/W4253235840"],"abstract_inverted_index":{"Recent":[0],"developments":[1],"in":[2,40,126,202],"speech":[3,11,128],"synthesis":[4,46],"have":[5],"produced":[6],"systems":[7],"capable":[8],"of":[9,36,54,82,93,114,145,153,178],"producing":[10],"which":[12,88,140,159,174],"closely":[13],"resembles":[14],"natural":[15,146],"speech,":[16,95],"and":[17,43,90,96,189],"researchers":[18],"now":[19],"strive":[20],"to":[21,57,60,63,101,103,137,143,165,170,193],"create":[22],"models":[23],"that":[24,206],"more":[25],"accurately":[26],"mimic":[27],"human":[28],"voices.":[29],"One":[30],"such":[31],"development":[32],"is":[33,53],"the":[34,80,83,168,203,217,221],"incorporation":[35],"multiple":[37],"linguistic":[38],"styles":[39],"various":[41],"languages":[42],"accents.":[44],"Speech":[45],"based":[47],"on":[48,220],"Hidden":[49],"Markov":[50],"Models":[51],"(HMM)":[52],"great":[55],"interest":[56],"researchers,":[58],"due":[59],"its":[61,74],"ability":[62],"produce":[64],"sophisticated":[65],"features":[66],"with":[67],"a":[68,123,134,162,171],"small":[69],"footprint.":[70],"Despite":[71],"some":[72],"progress,":[73],"quality":[75],"has":[76,98],"not":[77],"yet":[78],"reached":[79],"level":[81],"current":[84],"predominant":[85],"unit-selection":[86],"approaches,":[87],"select":[89],"concatenate":[91],"recordings":[92],"real":[94],"work":[97],"been":[99],"conducted":[100],"try":[102],"improve":[104],"HMM-based":[105,127,207],"systems.":[106],"In":[107],"this":[108,213],"paper,":[109],"we":[110],"present":[111],"an":[112],"application":[113],"long":[115],"short-term":[116],"memory":[117],"(LSTM)":[118],"deep":[119],"neural":[120],"networks":[121],"as":[122],"postfiltering":[124],"step":[125],"synthesis.":[129],"Our":[130],"motivation":[131],"stems":[132],"from":[133,161],"similar":[135],"desire":[136],"obtain":[138],"characteristics":[139],"are":[141,183,190],"closer":[142],"those":[144],"speech.":[147],"The":[148,180,199],"paper":[149,204],"analyzes":[150],"four":[151],"types":[152],"postfilters":[154,219],"obtained":[155],"using":[156,185,212],"five":[157],"voices,":[158],"range":[160],"single":[163],"postfilter":[164],"enhance":[166],"all":[167],"parameters,":[169],"multi-stream":[172,218],"proposal":[173],"separately":[175],"enhances":[176],"groups":[177],"parameters.":[179],"different":[181],"proposals":[182],"evaluated":[184],"three":[186],"objective":[187,223],"measures":[188],"statistically":[191],"compared":[192],"determine":[194],"any":[195],"significance":[196],"between":[197],"them.":[198],"results":[200],"described":[201],"indicate":[205],"voices":[208],"can":[209],"be":[210],"enhanced":[211],"approach,":[214],"specially":[215],"for":[216],"considered":[222],"measures.":[224]},"counts_by_year":[{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
