{"id":"https://openalex.org/W3015347659","doi":"https://doi.org/10.1109/icassp40776.2020.9053337","title":"Gaussian Lpcnet for Multisample Speech Synthesis","display_name":"Gaussian Lpcnet for Multisample Speech Synthesis","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3015347659","doi":"https://doi.org/10.1109/icassp40776.2020.9053337","mag":"3015347659"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9053337","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053337","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079224579","display_name":"Popov Va","orcid":"https://orcid.org/0000-0003-1395-2951"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Vadim Popov","raw_affiliation_strings":["Huawei Technologies Co. Ltd., Moscow, Russia"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co. Ltd., Moscow, Russia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034257289","display_name":"Mikhail Kudinov","orcid":"https://orcid.org/0000-0002-8555-4891"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mikhail Kudinov","raw_affiliation_strings":["Huawei Technologies Co. Ltd., Moscow, Russia"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co. Ltd., Moscow, Russia","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025256499","display_name":"Tasnima Sadekova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tasnima Sadekova","raw_affiliation_strings":["Huawei Technologies Co. Ltd., Moscow, Russia"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co. Ltd., Moscow, Russia","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5079224579"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.8558,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.8824607,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"6204","last_page":"6208"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7986915111541748},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7112871408462524},{"id":"https://openalex.org/keywords/degradation","display_name":"Degradation (telecommunications)","score":0.5722363591194153},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5376890897750854},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.5324462652206421},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.4531727433204651},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.44680255651474},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.4397630989551544},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.41450557112693787},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2914060354232788},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.11432862281799316},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.11021497845649719}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7986915111541748},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7112871408462524},{"id":"https://openalex.org/C2779679103","wikidata":"https://www.wikidata.org/wiki/Q5251805","display_name":"Degradation (telecommunications)","level":2,"score":0.5722363591194153},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5376890897750854},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.5324462652206421},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.4531727433204651},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.44680255651474},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.4397630989551544},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.41450557112693787},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2914060354232788},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.11432862281799316},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.11021497845649719},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9053337","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053337","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1578856370","https://openalex.org/W1602773783","https://openalex.org/W1973746598","https://openalex.org/W2013020033","https://openalex.org/W2519091744","https://openalex.org/W2584032004","https://openalex.org/W2587284713","https://openalex.org/W2748379347","https://openalex.org/W2769810959","https://openalex.org/W2797310469","https://openalex.org/W2890983311","https://openalex.org/W2899759260","https://openalex.org/W2903739847","https://openalex.org/W2928550135","https://openalex.org/W2943731990","https://openalex.org/W2946200149","https://openalex.org/W2963091184","https://openalex.org/W2963300588","https://openalex.org/W2963782041","https://openalex.org/W2963975282","https://openalex.org/W2964199361","https://openalex.org/W2964243274","https://openalex.org/W2964307104","https://openalex.org/W2970730223","https://openalex.org/W2972333964","https://openalex.org/W2972574864","https://openalex.org/W2972802841","https://openalex.org/W2984862052","https://openalex.org/W4294619240","https://openalex.org/W4298580827","https://openalex.org/W6732429163","https://openalex.org/W6733471323","https://openalex.org/W6748409065","https://openalex.org/W6753855596","https://openalex.org/W6755868737","https://openalex.org/W6757079273","https://openalex.org/W6763832098","https://openalex.org/W6917585676"],"related_works":["https://openalex.org/W2120771489","https://openalex.org/W2051376034","https://openalex.org/W2955597484","https://openalex.org/W3110551121","https://openalex.org/W2131486661","https://openalex.org/W2089240210","https://openalex.org/W2164147372","https://openalex.org/W2550171623","https://openalex.org/W4253660971","https://openalex.org/W2161396743"],"abstract_inverted_index":{"LPCNet":[0,36],"vocoder":[1,71],"has":[2,41],"recently":[3],"been":[4],"presented":[5],"to":[6,16,59,74,105],"TTS":[7],"community":[8],"and":[9,19,46,83,115],"is":[10,38,55,72],"now":[11],"gaining":[12],"increasing":[13],"popularity":[14],"due":[15,58],"its":[17],"effectiveness":[18],"high":[20],"quality":[21,106],"of":[22,35,49,79,94],"the":[23,50,66,69],"speech":[24,48],"synthesized":[25],"with":[26],"it.":[27],"In":[28],"this":[29],"work,":[30],"we":[31,63,108],"present":[32],"a":[33,91],"modification":[34],"that":[37,62,99],"1.5x":[39],"faster,":[40],"twice":[42],"less":[43],"non-zero":[44],"parameters":[45],"synthesizes":[47],"same":[51],"quality.":[52],"Such":[53],"enhancement":[54],"possible":[56],"mostly":[57],"two":[60,86],"features":[61],"introduce":[64],"into":[65],"original":[67],"architecture:":[68],"proposed":[70],"designed":[73],"generate":[75],"16-bit":[76],"signal":[77],"instead":[78],"8-bit":[80],"\u03bc-companded":[81],"signal,":[82],"it":[84],"predicts":[85],"consecutive":[87],"excitation":[88],"values":[89],"at":[90],"time":[92],"independently":[93],"each":[95],"other.":[96],"To":[97],"show":[98],"these":[100],"modifications":[101],"do":[102],"not":[103],"lead":[104],"degradation":[107],"train":[109],"models":[110],"for":[111],"five":[112],"different":[113],"languages":[114],"perform":[116],"extensive":[117],"human":[118],"evaluation.":[119]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
