{"id":"https://openalex.org/W2892237921","doi":"https://doi.org/10.1109/iwobi.2018.8464204","title":"Pre-training Long Short-term Memory Neural Networks for Efficient Regression in Artificial Speech Postfiltering","display_name":"Pre-training Long Short-term Memory Neural Networks for Efficient Regression in Artificial Speech Postfiltering","publication_year":2018,"publication_date":"2018-07-01","ids":{"openalex":"https://openalex.org/W2892237921","doi":"https://doi.org/10.1109/iwobi.2018.8464204","mag":"2892237921"},"language":"en","primary_location":{"id":"doi:10.1109/iwobi.2018.8464204","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwobi.2018.8464204","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Work Conference on Bioinspired Intelligence (IWOBI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053058951","display_name":"Marvin Coto-Jim\u00e9nez","orcid":"https://orcid.org/0000-0002-6833-9938"},"institutions":[{"id":"https://openalex.org/I31944674","display_name":"Universidad de Costa Rica","ror":"https://ror.org/02yzgww51","country_code":"CR","type":"education","lineage":["https://openalex.org/I31944674"]}],"countries":["CR"],"is_corresponding":true,"raw_author_name":"Marvin Coto-Jimenez","raw_affiliation_strings":["Escuela de Ingenier\u00e1a El\u00e9ctrica, Universidad de Costa Rica, San Jose, Costa Rica"],"affiliations":[{"raw_affiliation_string":"Escuela de Ingenier\u00e1a El\u00e9ctrica, Universidad de Costa Rica, San Jose, Costa Rica","institution_ids":["https://openalex.org/I31944674"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5053058951"],"corresponding_institution_ids":["https://openalex.org/I31944674"],"apc_list":null,"apc_paid":null,"fwci":0.5062,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.74249942,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8415968418121338},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.7309518456459045},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6612532734870911},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6360983848571777},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5920326113700867},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5873517394065857},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.5516543984413147},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.5048390030860901},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.4209061861038208},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.41432619094848633},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.3433871269226074},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.333820641040802}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8415968418121338},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.7309518456459045},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6612532734870911},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6360983848571777},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5920326113700867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5873517394065857},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.5516543984413147},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.5048390030860901},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.4209061861038208},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41432619094848633},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.3433871269226074},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.333820641040802},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iwobi.2018.8464204","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwobi.2018.8464204","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Work Conference on Bioinspired Intelligence (IWOBI)","raw_type":"proceedings-article"},{"id":"pmh:oai:https://www.kerwa.ucr.ac.cr:10669/86291","is_oa":false,"landing_page_url":"https://ieeexplore.ieee.org/document/8464204","pdf_url":null,"source":{"id":"https://openalex.org/S4306400069","display_name":"Investigative News in Education (Universidad de Costa Rica)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I198243066","host_organization_name":"Universidad Nacional","host_organization_lineage":["https://openalex.org/I198243066"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE International Work Conference on Bioinspired Intelligence (IWOBI). San Carlos, Costa Rica. 18-20 de julio de 2018","raw_type":"comunicaci\u00f3n de congreso"},{"id":"pmh:oai:kerwa.ucr.ac.cr:10669/86291","is_oa":false,"landing_page_url":"https://hdl.handle.net/10669/86291","pdf_url":null,"source":{"id":"https://openalex.org/S4306400069","display_name":"Investigative News in Education (Universidad de Costa Rica)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I198243066","host_organization_name":"Universidad Nacional","host_organization_lineage":["https://openalex.org/I198243066"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE International Work Conference on Bioinspired Intelligence (IWOBI). San Carlos, Costa Rica. 18-20 de julio de 2018","raw_type":"comunicaci\u00f3n de congreso"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W95152782","https://openalex.org/W1499332833","https://openalex.org/W1533861849","https://openalex.org/W1566256432","https://openalex.org/W1600722501","https://openalex.org/W1736701665","https://openalex.org/W1778816975","https://openalex.org/W1861150963","https://openalex.org/W1902054819","https://openalex.org/W1987992317","https://openalex.org/W1990383786","https://openalex.org/W1990505856","https://openalex.org/W2005708641","https://openalex.org/W2049036695","https://openalex.org/W2064675550","https://openalex.org/W2102003408","https://openalex.org/W2111284386","https://openalex.org/W2124558353","https://openalex.org/W2138857742","https://openalex.org/W2147768505","https://openalex.org/W2293049663","https://openalex.org/W2293255527","https://openalex.org/W2294351487","https://openalex.org/W2294797155","https://openalex.org/W2508231302","https://openalex.org/W2531641781","https://openalex.org/W2715071750","https://openalex.org/W2789740382","https://openalex.org/W2963971656","https://openalex.org/W4294375521","https://openalex.org/W4300458848","https://openalex.org/W4301420498","https://openalex.org/W6603838645","https://openalex.org/W6631943919","https://openalex.org/W6633947590","https://openalex.org/W6638023308","https://openalex.org/W6639125025","https://openalex.org/W6647815124","https://openalex.org/W6680300913","https://openalex.org/W6682778277","https://openalex.org/W6696767757","https://openalex.org/W6696843773"],"related_works":["https://openalex.org/W3013693939","https://openalex.org/W2159052453","https://openalex.org/W2566616303","https://openalex.org/W3131327266","https://openalex.org/W2734887215","https://openalex.org/W4297051394","https://openalex.org/W2752972570","https://openalex.org/W3204184292","https://openalex.org/W4386815338","https://openalex.org/W3037110488"],"abstract_inverted_index":{"Several":[0],"attempts":[1],"to":[2,14,23,155],"enhance":[3],"statistical":[4,147],"parametric":[5,148],"speech":[6,21,49,61,149],"synthesis":[7],"have":[8],"contemplated":[9],"deep-learning-based":[10],"postfilters,":[11,104],"which":[12,105],"learn":[13],"perform":[15],"a":[16,37,63,88,100,107],"mapping":[17],"of":[18,54,58,74,96,102,109,115,121,136,160],"the":[19,24,28,52,56,59,94,113,122,128,133,137,146,156,161],"synthetic":[20],"parameters":[22,120],"natural":[25],"ones,":[26],"reducing":[27],"gap":[29],"between":[30],"them.":[31],"In":[32],"this":[33,97],"paper,":[34],"we":[35],"introduce":[36],"new":[38],"pre-training":[39],"approach":[40,68,159],"for":[41,48,84,112],"neural":[42],"networks,":[43],"applied":[44],"in":[45,62,131,144,150],"LSTM-based":[46],"postfilters":[47,85],"synthesis,":[50],"with":[51,70],"objective":[53],"enhancing":[55,145],"quality":[57],"synthesized":[60],"more":[64],"efficient":[65],"manner.":[66],"Our":[67],"begins":[69],"an":[71,82],"auto-regressive":[72],"training":[73,134],"one":[75],"LSTM":[76,138],"network,":[77],"whose":[78],"is":[79],"used":[80],"as":[81],"initialization":[83,98,129],"based":[86],"on":[87,99],"denoising":[89,110],"autoencoder":[90],"architecture.":[91],"We":[92],"show":[93,126],"advantages":[95],"set":[101,114],"multi-stream":[103],"encompass":[106],"collection":[108],"autoencoders":[111],"MFCC":[116],"and":[117,140],"fundamental":[118],"frequency":[119],"artificial":[123],"voice.":[124],"Results":[125],"that":[127],"succeeds":[130],"lowering":[132],"time":[135],"networks":[139],"achieves":[141],"better":[142],"results":[143],"most":[151],"cases,":[152],"when":[153],"compared":[154],"common":[157],"random-initialized":[158],"networks.":[162]},"counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2025-10-10T00:00:00"}
