{"id":"https://openalex.org/W4414140937","doi":"https://doi.org/10.1109/icmew68306.2025.11152258","title":"Bandwidth Extension System for Throat Microphone Speech Reconstruction","display_name":"Bandwidth Extension System for Throat Microphone Speech Reconstruction","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4414140937","doi":"https://doi.org/10.1109/icmew68306.2025.11152258"},"language":"en","primary_location":{"id":"doi:10.1109/icmew68306.2025.11152258","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew68306.2025.11152258","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112529831","display_name":"Yu Bing Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yu Xu","raw_affiliation_strings":["The University of Tokyo,Graduate School of Engineering,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,Graduate School of Engineering,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103280816","display_name":"Xuexin Qin","orcid":"https://orcid.org/0000-0001-9858-6545"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xiaokai Qin","raw_affiliation_strings":["Nanyang Technological University,College of Computing and Data Science,Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University,College of Computing and Data Science,Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116594555","display_name":"Tianyu Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Tianyu Fan","raw_affiliation_strings":["Nanyang Technological University,College of Computing and Data Science,Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University,College of Computing and Data Science,Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070872826","display_name":"Eng Siong Chng","orcid":"https://orcid.org/0000-0001-6257-7399"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Eng Siong Chng","raw_affiliation_strings":["Institute of Science Tokyo,School of Engineering,Yokohama,Japan"],"affiliations":[{"raw_affiliation_string":"Institute of Science Tokyo,School of Engineering,Yokohama,Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053726259","display_name":"Sheng Li","orcid":"https://orcid.org/0000-0001-7636-3797"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Sheng Li","raw_affiliation_strings":["The University of Tokyo,Graduate School of Engineering,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,Graduate School of Engineering,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041213266","display_name":"Nobuaki Minematsu","orcid":"https://orcid.org/0000-0002-8778-9555"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Nobuaki Minematsu","raw_affiliation_strings":["The University of Tokyo,Graduate School of Engineering,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,Graduate School of Engineering,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010841595","display_name":"Daisuke Saito","orcid":"https://orcid.org/0000-0003-3200-579X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Daisuke Saito","raw_affiliation_strings":["The University of Tokyo,Graduate School of Engineering,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,Graduate School of Engineering,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5112529831"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.29557258,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.6915000081062317},{"id":"https://openalex.org/keywords/narrowband","display_name":"Narrowband","score":0.6345000267028809},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5496000051498413},{"id":"https://openalex.org/keywords/bandwidth-extension","display_name":"Bandwidth extension","score":0.5049999952316284},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.4404999911785126},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.42910000681877136},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.3930000066757202},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.37400001287460327}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7674999833106995},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6980999708175659},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.6915000081062317},{"id":"https://openalex.org/C2776096036","wikidata":"https://www.wikidata.org/wiki/Q1140483","display_name":"Narrowband","level":2,"score":0.6345000267028809},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5496000051498413},{"id":"https://openalex.org/C9387945","wikidata":"https://www.wikidata.org/wiki/Q4854770","display_name":"Bandwidth extension","level":4,"score":0.5049999952316284},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.4404999911785126},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.42910000681877136},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.3930000066757202},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.37400001287460327},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.36480000615119934},{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.36469998955726624},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28940001130104065},{"id":"https://openalex.org/C36922181","wikidata":"https://www.wikidata.org/wiki/Q7047650","display_name":"Noise-canceling microphone","level":5,"score":0.2883000075817108},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.2644999921321869},{"id":"https://openalex.org/C157138929","wikidata":"https://www.wikidata.org/wiki/Q570","display_name":"Loudspeaker","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.2565000057220459},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.2554999887943268}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icmew68306.2025.11152258","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew68306.2025.11152258","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"},{"id":"pmh:oai:t2r2.star.titech.ac.jp:50734101","is_oa":false,"landing_page_url":"http://t2r2.star.titech.ac.jp/cgi-bin/publicationinfo.cgi?q_publication_content_number=CTT100933504","pdf_url":null,"source":{"id":"https://openalex.org/S4377196385","display_name":"Tokyo Tech Research Repository (Tokyo Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I114531698","host_organization_name":"Tokyo Institute of Technology","host_organization_lineage":["https://openalex.org/I114531698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference Paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2166344203","https://openalex.org/W2245745904","https://openalex.org/W2513535794","https://openalex.org/W2765742664","https://openalex.org/W2786825824","https://openalex.org/W2998572311","https://openalex.org/W3160652646","https://openalex.org/W3211264909","https://openalex.org/W4282828401","https://openalex.org/W4297841623","https://openalex.org/W4372341094","https://openalex.org/W4402112024"],"related_works":["https://openalex.org/W2059847929","https://openalex.org/W107154053","https://openalex.org/W4319862422","https://openalex.org/W1971598839","https://openalex.org/W2133828239","https://openalex.org/W3207737697","https://openalex.org/W2017964352","https://openalex.org/W3144767625","https://openalex.org/W2097303478","https://openalex.org/W2900695998"],"abstract_inverted_index":{"The":[0],"throat":[1,26,96],"microphone":[2,97],"is":[3],"effective":[4],"for":[5,18,32,95],"capturing":[6],"speech":[7,19,27,43,51,81],"in":[8],"noisy":[9],"environments":[10],"but":[11],"typically":[12],"produces":[13],"narrowband":[14],"signals,":[15],"requiring":[16],"post-processing":[17],"enhancement.":[20],"Additionally,":[21],"the":[22,79,85],"limited":[23],"availability":[24],"of":[25],"(TS)":[28],"datasets":[29],"poses":[30],"challenges":[31],"system":[33],"development.":[34],"To":[35],"address":[36],"this,":[37],"we":[38],"introduce":[39],"Dent-DDSP,":[40],"a":[41,68],"robust":[42],"generator":[44],"that":[45],"simulates":[46],"TS":[47],"using":[48],"existing":[49],"air-conducted":[50],"(AS)":[52],"datasets.":[53],"We":[54],"employ":[55],"bandwidth":[56],"extension":[57],"(BWE)":[58],"methods":[59],"to":[60],"recover":[61],"missing":[62],"high-frequency":[63],"components":[64],"and":[65,73,84],"use":[66],"TUNet,":[67],"DNN-based":[69],"model":[70],"combining":[71],"transformer":[72],"UNet":[74],"structures.":[75],"Experimental":[76],"results":[77],"demonstrate":[78],"superior":[80],"quality":[82],"enhancement":[83],"unit":[86],"language":[87],"model\u2019s":[88],"better":[89],"perceptual":[90],"performance,":[91],"highlighting":[92],"promising":[93],"avenues":[94],"applications.":[98]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
