{"id":"https://openalex.org/W2187234408","doi":"https://doi.org/10.21437/interspeech.2013-669","title":"A hybrid approach to electrolaryngeal speech enhancement based on spectral subtraction and statistical voice conversion","display_name":"A hybrid approach to electrolaryngeal speech enhancement based on spectral subtraction and statistical voice conversion","publication_year":2013,"publication_date":"2013-08-25","ids":{"openalex":"https://openalex.org/W2187234408","doi":"https://doi.org/10.21437/interspeech.2013-669","mag":"2187234408"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2013-669","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2013-669","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2013","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5106710403","display_name":"Kou Tanaka","orcid":"https://orcid.org/0009-0003-7107-607X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kou Tanaka","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078330211","display_name":"Tomoki Toda","orcid":"https://orcid.org/0000-0001-8146-1279"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tomoki Toda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000692949","display_name":"Graham Neubig","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Graham Neubig","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040108974","display_name":"Sakriani Sakti","orcid":"https://orcid.org/0000-0001-5509-8963"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sakriani Sakti","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020994673","display_name":"Satoshi Nakamura","orcid":"https://orcid.org/0000-0001-6956-3803"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Satoshi Nakamura","raw_affiliation_strings":["Nara Institute of Science & Technology#TAB#"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science & Technology#TAB#","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5106710403"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.9152,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.8715591,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"3067","last_page":"3071"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13289","display_name":"Infant Health and Development","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/3611","display_name":"Pharmacy"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7052361369132996},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.7007462382316589},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6542989611625671},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.5179471373558044},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.397093802690506},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33265647292137146},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.12316259741783142}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7052361369132996},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.7007462382316589},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6542989611625671},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.5179471373558044},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.397093802690506},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33265647292137146},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.12316259741783142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2013-669","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2013-669","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2013","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1523372075","https://openalex.org/W2022125261","https://openalex.org/W2029434926","https://openalex.org/W2049686551","https://openalex.org/W2056852181","https://openalex.org/W2116593694","https://openalex.org/W2120605154","https://openalex.org/W2123003832","https://openalex.org/W2128653836","https://openalex.org/W2151500768","https://openalex.org/W2154920538","https://openalex.org/W2156142001","https://openalex.org/W2159089611","https://openalex.org/W2161501672","https://openalex.org/W2395578248"],"related_works":["https://openalex.org/W2770665941","https://openalex.org/W3096184950","https://openalex.org/W3135230428","https://openalex.org/W2120771489","https://openalex.org/W2904739811","https://openalex.org/W2275432853","https://openalex.org/W2131711534","https://openalex.org/W2559040841","https://openalex.org/W114661351","https://openalex.org/W4200596008"],"abstract_inverted_index":{"We":[0,155],"present":[1],"a":[2,20,157],"hybrid":[3,158,207],"approach":[4,208],"to":[5,27,30,48,69,151],"improving":[6],"naturalness":[7,106,124,188],"of":[8,125,133,140],"electrolaryngeal":[9,201],"(EL)":[10],"speech":[11,83,127,192],"while":[12,193],"minimizing":[13],"degradation":[14,97,147],"in":[15,98,105,148,153,187],"intelligibility.":[16],"An":[17],"electrolarynx":[18],"is":[19],"device":[21,63],"that":[22],"artificially":[23],"generates":[24],"excitation":[25,51,58,110,131,175],"sounds":[26,44,59,111],"enable":[28],"laryngectomees":[29,36],"produce":[31,38],"EL":[32,41,70,82,126,141,191],"speech.":[33,71],"Although":[34],"proficient":[35],"can":[37],"quite":[39],"intelligible":[40],"speech,":[42,142,202],"it":[43,144],"very":[45],"unnatural":[46],"due":[47],"the":[49,54,57,62,108,116,119,161,181],"mechanical":[50,109],"produced":[52,60],"by":[53,61],"device.":[55],"Moreover,":[56],"often":[64],"leak":[65],"outside,":[66],"adding":[67],"noise":[68,87,162],"To":[72],"address":[73],"these":[74],"issues,":[75],"previous":[76],"work":[77],"has":[78],"proposed":[79,182],"methods":[80],"for":[81,165,173],"enhancement":[84],"through":[85],"either":[86],"reduction":[88,163],"or":[89],"voice":[90,170,205],"conversion.":[91,154],"The":[92,177],"former":[93],"usually":[94,145],"causes":[95,146],"no":[96],"intelligibility":[99,149,195],"but":[100,143],"yields":[101,184],"only":[102],"small":[103],"improvements":[104,186],"as":[107],"remain":[112],"essentially":[113],"unchanged.":[114],"On":[115],"other":[117],"hand,":[118],"latter":[120],"method":[121,159,164,172,183],"significantly":[122],"improves":[123],"using":[128,160],"spectral":[129,167,203],"and":[130,169],"parameters":[132,139,168],"natural":[134],"voices":[135],"converted":[136],"from":[137],"acoustic":[138],"owing":[150],"errors":[152],"propose":[156],"enhancing":[166],"conversion":[171],"predicting":[174],"parameters.":[176],"experimental":[178],"results":[179],"demonstrate":[180],"significant":[185],"compared":[189],"with":[190],"keeping":[194],"high":[196],"enough.":[197],"Index":[198],"Terms:":[199],"speaking-aid,":[200],"subtraction,":[204],"conversion,":[206]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
