{"id":"https://openalex.org/W2156060621","doi":"https://doi.org/10.1109/icassp.2009.4960405","title":"Voice conversion for various types of body transmitted speech","display_name":"Voice conversion for various types of body transmitted speech","publication_year":2009,"publication_date":"2009-04-01","ids":{"openalex":"https://openalex.org/W2156060621","doi":"https://doi.org/10.1109/icassp.2009.4960405","mag":"2156060621"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2009.4960405","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2009.4960405","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://naist.repo.nii.ac.jp/records/4645","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078330211","display_name":"Tomoki Toda","orcid":"https://orcid.org/0000-0001-8146-1279"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Tomoki Toda","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031967669","display_name":"Keigo Nakamura","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Keigo Nakamura","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075350740","display_name":"Hidehiko Sekimoto","orcid":null},"institutions":[{"id":"https://openalex.org/I146230289","display_name":"Omron (Japan)","ror":"https://ror.org/00q0w1h45","country_code":"JP","type":"company","lineage":["https://openalex.org/I146230289"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hidehiko Sekimoto","raw_affiliation_strings":["OMRON Corporation, Japan"],"affiliations":[{"raw_affiliation_string":"OMRON Corporation, Japan","institution_ids":["https://openalex.org/I146230289"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021868389","display_name":"Kiyohiro Shikano","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kiyohiro Shikano","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5078330211"],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":4.2852,"has_fulltext":true,"cited_by_count":31,"citation_normalized_percentile":{"value":0.94535809,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"3601","last_page":"3604"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7893587946891785},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7397624254226685},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.6025406122207642},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.5750178098678589},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5448744893074036},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.504878580570221},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.45656687021255493},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.4321593642234802},{"id":"https://openalex.org/keywords/background-noise","display_name":"Background noise","score":0.32541754841804504},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27662965655326843},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.14804059267044067}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7893587946891785},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7397624254226685},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.6025406122207642},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.5750178098678589},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5448744893074036},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.504878580570221},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.45656687021255493},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.4321593642234802},{"id":"https://openalex.org/C100675267","wikidata":"https://www.wikidata.org/wiki/Q1371624","display_name":"Background noise","level":2,"score":0.32541754841804504},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27662965655326843},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.14804059267044067},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/icassp.2009.4960405","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2009.4960405","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.157.7230","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.157.7230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://spalab.naist.jp/~tomoki/Tomoki/Conferences/ICASSP2009_BTVC.pdf","raw_type":"text"},{"id":"pmh:oai:irdb.nii.ac.jp:01146:0005783096","is_oa":true,"landing_page_url":"https://naist.repo.nii.ac.jp/records/4645","pdf_url":null,"source":{"id":"https://openalex.org/S7407056385","display_name":"Institutional Repositories DataBase (IRDB)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I184597095","host_organization_name":"National Institute of Informatics","host_organization_lineage":["https://openalex.org/I184597095"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":{"id":"pmh:oai:irdb.nii.ac.jp:01146:0005783096","is_oa":true,"landing_page_url":"https://naist.repo.nii.ac.jp/records/4645","pdf_url":null,"source":{"id":"https://openalex.org/S7407056385","display_name":"Institutional Repositories DataBase (IRDB)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I184597095","host_organization_name":"National Institute of Informatics","host_organization_lineage":["https://openalex.org/I184597095"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W91932436","https://openalex.org/W1484904337","https://openalex.org/W1491561031","https://openalex.org/W1523372075","https://openalex.org/W1540787848","https://openalex.org/W1550001449","https://openalex.org/W1558063916","https://openalex.org/W1566744681","https://openalex.org/W1582631065","https://openalex.org/W1991590998","https://openalex.org/W1991893800","https://openalex.org/W2011916518","https://openalex.org/W2049686551","https://openalex.org/W2078435788","https://openalex.org/W2117193121","https://openalex.org/W2120605154","https://openalex.org/W2123003832","https://openalex.org/W2141684970","https://openalex.org/W2156142001","https://openalex.org/W2943553228","https://openalex.org/W4402490932","https://openalex.org/W6603833124","https://openalex.org/W6631309588","https://openalex.org/W6632967009","https://openalex.org/W6633899882","https://openalex.org/W6634654710"],"related_works":["https://openalex.org/W2120605154","https://openalex.org/W2156142001","https://openalex.org/W2123003832","https://openalex.org/W2049686551","https://openalex.org/W1991590998","https://openalex.org/W2078435788","https://openalex.org/W2248536413","https://openalex.org/W2008120082","https://openalex.org/W1982854652","https://openalex.org/W1552784139","https://openalex.org/W1597274768","https://openalex.org/W3149890502","https://openalex.org/W2860196236","https://openalex.org/W2621540445","https://openalex.org/W3118026694","https://openalex.org/W2896834262","https://openalex.org/W948130709","https://openalex.org/W1591575995","https://openalex.org/W3057604687","https://openalex.org/W2251578476"],"abstract_inverted_index":{"In":[0,42],"this":[1],"paper,":[2],"we":[3,69],"review":[4],"our":[5,45],"proposed":[6,47,91],"statistical":[7],"voice":[8],"conversion":[9,28,72],"approaches":[10],"to":[11,33,38,44],"enhancing":[12,50,61,75],"various":[13],"types":[14],"of":[15,49,60,74,98],"body":[16,51,62,76,99],"transmitted":[17,26,52,63,77,100],"speech":[18,27,40,54,57,65,79,83],"captured":[19],"with":[20],"non-audible":[21],"murmur":[22],"(NAM)":[23],"microphone.":[24],"Body":[25],"is":[29],"a":[30,35],"potential":[31],"technique":[32],"bring":[34],"new":[36],"paradigm":[37],"human-to-human":[39],"communication.":[41,84],"addition":[43],"previously":[46],"methods":[48,73,92],"unvoiced":[53],"for":[55,66,80],"silent":[56],"communication":[58],"and":[59],"artificial":[64],"speaking":[67],"aid,":[68],"further":[70],"propose":[71],"voiced":[78,101],"noise":[81],"robust":[82],"An":[85],"experimental":[86],"result":[87],"demonstrates":[88],"that":[89],"the":[90],"yield":[93],"significant":[94],"improvements":[95],"in":[96],"quality":[97],"speech.":[102]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
