{"id":"https://openalex.org/W4400032976","doi":"https://doi.org/10.1109/tmc.2024.3419170","title":"UltraSR: Silent Speech Reconstruction via Acoustic Sensing","display_name":"UltraSR: Silent Speech Reconstruction via Acoustic Sensing","publication_year":2024,"publication_date":"2024-06-26","ids":{"openalex":"https://openalex.org/W4400032976","doi":"https://doi.org/10.1109/tmc.2024.3419170"},"language":"en","primary_location":{"id":"doi:10.1109/tmc.2024.3419170","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2024.3419170","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050655047","display_name":"Yongjian Fu","orcid":"https://orcid.org/0000-0001-8481-2644"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yongjian Fu","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University, Changsha, Hunan, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101765621","display_name":"Shuning Wang","orcid":"https://orcid.org/0000-0002-9727-1434"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuning Wang","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University, Changsha, Hunan, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066047713","display_name":"Linghui Zhong","orcid":"https://orcid.org/0000-0003-2178-5073"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linghui Zhong","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University, Changsha, Hunan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University, Changsha, Hunan, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052862237","display_name":"Lili Chen","orcid":"https://orcid.org/0000-0002-6630-0976"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lili Chen","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015419107","display_name":"Ju Ren","orcid":"https://orcid.org/0000-0003-2782-183X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ju Ren","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069049205","display_name":"Yaoxue Zhang","orcid":"https://orcid.org/0000-0001-6717-461X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaoxue Zhang","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5050655047"],"corresponding_institution_ids":["https://openalex.org/I139660479"],"apc_list":null,"apc_paid":null,"fwci":3.415,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.93174145,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"23","issue":"12","first_page":"12848","last_page":"12865"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9315000176429749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9315000176429749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9307000041007996,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7723838090896606},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.622300386428833}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7723838090896606},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.622300386428833}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmc.2024.3419170","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2024.3419170","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4285073634","display_name":null,"funder_award_id":"62341201","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4461067470","display_name":null,"funder_award_id":"62122095","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4936291841","display_name":null,"funder_award_id":"62072472","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F3230804744","display_name":"Guoqiang Institute, Tsinghua University","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W1975163393","https://openalex.org/W2043199434","https://openalex.org/W2067295501","https://openalex.org/W2079735306","https://openalex.org/W2092889652","https://openalex.org/W2138621090","https://openalex.org/W2156279557","https://openalex.org/W2194775991","https://openalex.org/W2322064186","https://openalex.org/W2394945029","https://openalex.org/W2419247625","https://openalex.org/W2516001803","https://openalex.org/W2587706859","https://openalex.org/W2746457594","https://openalex.org/W2764166175","https://openalex.org/W2765636281","https://openalex.org/W2791862028","https://openalex.org/W2795038031","https://openalex.org/W2832631560","https://openalex.org/W2940177920","https://openalex.org/W2940585064","https://openalex.org/W2941048526","https://openalex.org/W2962801832","https://openalex.org/W2962915147","https://openalex.org/W2963019222","https://openalex.org/W2963073614","https://openalex.org/W2963091184","https://openalex.org/W2963192365","https://openalex.org/W2963206679","https://openalex.org/W2963216553","https://openalex.org/W2964247977","https://openalex.org/W2968379763","https://openalex.org/W3004196347","https://openalex.org/W3010673682","https://openalex.org/W3035626590","https://openalex.org/W3083703874","https://openalex.org/W3105229878","https://openalex.org/W3118639493","https://openalex.org/W3140645045","https://openalex.org/W3143308704","https://openalex.org/W3144915432","https://openalex.org/W3159134136","https://openalex.org/W3198533616","https://openalex.org/W3201134189","https://openalex.org/W3207984187","https://openalex.org/W4213171936","https://openalex.org/W4220726235","https://openalex.org/W4226050909","https://openalex.org/W4237723258","https://openalex.org/W4256527044","https://openalex.org/W4294891759","https://openalex.org/W4294891893","https://openalex.org/W4320060010","https://openalex.org/W4392499786","https://openalex.org/W4395685900","https://openalex.org/W6661954145","https://openalex.org/W6678815747","https://openalex.org/W6697974390","https://openalex.org/W6732872814","https://openalex.org/W6745388339","https://openalex.org/W6745740328","https://openalex.org/W6755207826","https://openalex.org/W6762114000","https://openalex.org/W6783596713","https://openalex.org/W6862504488"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"Silent":[0],"Speech":[1],"Interfaces":[2],"(SSI)":[3],"have":[4],"been":[5],"developed":[6],"to":[7,114,128,153,213],"convert":[8],"silent":[9,138],"articulatory":[10,101],"gestures":[11,102,156],"into":[12],"speech,":[13],"aiding":[14],"communication":[15],"in":[16,44,67,189],"public":[17],"spaces":[18],"and":[19,78,120,186,207],"assisting":[20],"individuals":[21],"with":[22,218],"aphasia.":[23],"Previous":[24],"SSIs,":[25],"which":[26],"rely":[27],"on":[28,57,103,182],"wearable":[29],"devices":[30],"or":[31,39],"cameras,":[32],"often":[33],"pose":[34],"issues":[35],"like":[36],"prolonged":[37],"contact":[38],"privacy":[40],"risks.":[41],"Recent":[42],"advancements":[43],"acoustic":[45],"sensing":[46,87],"present":[47],"new":[48,123,216],"opportunities":[49],"for":[50,90,164,177,215],"gesture":[51],"sensing,":[52],"but":[53],"they":[54],"typically":[55],"focus":[56],"content":[58],"classification":[59],"rather":[60],"than":[61],"reconstructing":[62],"audible":[63,92,135],"speech.":[64],"This":[65],"results":[66],"the":[68,97,132,141,209],"loss":[69],"of":[70,99,134,140,144,222],"crucial":[71],"speech":[72,93,129,136,232],"characteristics":[73],"such":[74],"as":[75,203,205],"rate,":[76],"intonation,":[77],"emotion.In":[79],"this":[80],"paper,":[81],"we":[82],"propose":[83],"UltraSR,":[84],"a":[85,109,122,171,183,198],"novel":[86],"system":[88],"designed":[89],"accurate":[91],"reconstruction":[94,133],"by":[95],"analyzing":[96],"disturbance":[98],"tiny":[100],"reflected":[104],"ultrasound":[105,127,223],"signals.":[106],"UltraSR":[107,148,181,195],"employs":[108],"multi-scale":[110],"feature":[111],"extraction":[112],"scheme":[113],"aggregate":[115],"information":[116],"from":[117,137,157,211],"multiple":[118],"views":[119],"introduces":[121],"model":[124,166],"that":[125,194],"maps":[126],"signals,":[130],"enabling":[131],"gestures.Instead":[139],"laborious":[142],"collection":[143],"massive":[145],"training":[146],"data,":[147,224],"constructs":[149],"an":[150],"inverse":[151],"task":[152],"generate":[154],"virtual":[155],"widely":[158],"available":[159],"audio":[160],"(e.g.,":[161],"phone":[162],"calls)":[163],"efficient":[165],"training.":[167],"Additionally,":[168],"it":[169,188],"incorporates":[170],"finetuning":[172],"mechanism":[173],"using":[174],"unlabeled":[175],"data":[176],"user":[178],"adaptation.We":[179],"implemented":[180],"portable":[184],"smartphone":[185],"evaluated":[187],"various":[190],"environments.":[191],"Results":[192],"show":[193],"can":[196],"achieve":[197],"Character":[199],"Error":[200],"Rate":[201],"(CER)":[202],"low":[204],"5.22%":[206],"reduce":[208],"CER":[210],"80.13%":[212],"6.31%":[214],"users":[217],"only":[219],"1":[220],"hour":[221],"outperforming":[225],"state-of-the-art":[226],"acoustic-based":[227],"approaches":[228],"while":[229],"preserving":[230],"rich":[231],"information.":[233]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
