{"id":"https://openalex.org/W124515498","doi":"https://doi.org/10.21437/interspeech.2004-596","title":"Application of voice conversion to hearing-impaired Mandarin speech enhancement","display_name":"Application of voice conversion to hearing-impaired Mandarin speech enhancement","publication_year":2004,"publication_date":"2004-10-04","ids":{"openalex":"https://openalex.org/W124515498","doi":"https://doi.org/10.21437/interspeech.2004-596","mag":"124515498"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2004-596","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-596","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083609304","display_name":"Chen-Long Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Chen-Long Lee","raw_affiliation_strings":["National Yang Ming Chiao Tung University"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043140115","display_name":"Wen\u2010Whei Chang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen-Whei Chang","raw_affiliation_strings":["\u96fb\u6a5f\u5de5\u7a0b\u5b78\u7cfb"],"affiliations":[{"raw_affiliation_string":"\u96fb\u6a5f\u5de5\u7a0b\u5b78\u7cfb","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111556710","display_name":"Yuan-Chuan Chiang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210154699","display_name":"National Hsinchu University of Education","ror":"https://ror.org/05prep819","country_code":"TW","type":"education","lineage":["https://openalex.org/I4210154699"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yuan-Chuan Chiang","raw_affiliation_strings":["National Hsinchu Teachers College"],"affiliations":[{"raw_affiliation_string":"National Hsinchu Teachers College","institution_ids":["https://openalex.org/I4210154699"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5083609304"],"corresponding_institution_ids":["https://openalex.org/I148366613"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.01564017,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1829","last_page":"1832"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.8712388277053833},{"id":"https://openalex.org/keywords/intelligibility","display_name":"Intelligibility (philosophy)","score":0.7896705865859985},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7429909706115723},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6766663789749146},{"id":"https://openalex.org/keywords/hearing-impaired","display_name":"Hearing impaired","score":0.6417227983474731},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5859524011611938},{"id":"https://openalex.org/keywords/syllable","display_name":"Syllable","score":0.4901183545589447},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.45186617970466614},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.45176368951797485},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.4454689919948578},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4381561577320099},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.42488640546798706},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28471916913986206},{"id":"https://openalex.org/keywords/audiology","display_name":"Audiology","score":0.2169376015663147},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.07589754462242126}],"concepts":[{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.8712388277053833},{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.7896705865859985},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7429909706115723},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6766663789749146},{"id":"https://openalex.org/C3020736805","wikidata":"https://www.wikidata.org/wiki/Q16035842","display_name":"Hearing impaired","level":2,"score":0.6417227983474731},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5859524011611938},{"id":"https://openalex.org/C109089402","wikidata":"https://www.wikidata.org/wiki/Q8188","display_name":"Syllable","level":2,"score":0.4901183545589447},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.45186617970466614},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.45176368951797485},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.4454689919948578},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4381561577320099},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.42488640546798706},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28471916913986206},{"id":"https://openalex.org/C548259974","wikidata":"https://www.wikidata.org/wiki/Q569965","display_name":"Audiology","level":1,"score":0.2169376015663147},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.07589754462242126},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2004-596","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-596","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6899999976158142,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W1560013842","https://openalex.org/W2045122003","https://openalex.org/W2049633694","https://openalex.org/W2083603732","https://openalex.org/W2116756305","https://openalex.org/W2156142001","https://openalex.org/W2164764235"],"related_works":["https://openalex.org/W1986772939","https://openalex.org/W2081919107","https://openalex.org/W2037635165","https://openalex.org/W2738829087","https://openalex.org/W2089150823","https://openalex.org/W2542062716","https://openalex.org/W1505346162","https://openalex.org/W3115948027","https://openalex.org/W4200562864","https://openalex.org/W2405110677"],"abstract_inverted_index":{"This":[0],"paper":[1],"studies":[2],"the":[3,18,51,72,77],"application":[4],"of":[5,21,79],"voice":[6],"conversion":[7,54],"to":[8],"hearing-impaired":[9,46,80],"Mandarin":[10,31,81],"speech":[11],"enhancement.":[12],"The":[13],"system":[14,74],"is":[15,55],"based":[16,62],"on":[17,63],"combined":[19],"use":[20],"a":[22,27,37,58,64],"sinusoidal":[23],"analysis-synthesis":[24],"model":[25],"and":[26,47],"priori":[28],"knowledge":[29],"about":[30],"syllable":[32],"phonetic":[33],"structures.":[34],"We":[35],"propose":[36],"time-scale":[38],"modification":[39],"algorithm":[40],"that":[41,71],"finds":[42],"accurate":[43],"alignments":[44],"between":[45],"normal":[48],"utterances.":[49],"Using":[50],"alignments,":[52],"spectral":[53],"performed":[56],"by":[57],"continuous":[59],"probabilistic":[60],"transform":[61],"Gaussian":[65],"mixture":[66],"model.":[67],"Simulation":[68],"results":[69],"indicate":[70],"proposed":[73],"can":[75],"improve":[76],"intelligibility":[78],"speech.":[82]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
