{"id":"https://openalex.org/W4403913173","doi":"https://doi.org/10.1145/3678957.3685720","title":"Whispering Wearables: Multimodal Approach to Silent Speech Recognition with Head-Worn Devices","display_name":"Whispering Wearables: Multimodal Approach to Silent Speech Recognition with Head-Worn Devices","publication_year":2024,"publication_date":"2024-10-30","ids":{"openalex":"https://openalex.org/W4403913173","doi":"https://doi.org/10.1145/3678957.3685720"},"language":"en","primary_location":{"id":"doi:10.1145/3678957.3685720","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3678957.3685720","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conference on Multimodel Interaction","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075120384","display_name":"Tanmay Srivastava","orcid":"https://orcid.org/0000-0003-0144-7931"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tanmay Srivastava","raw_affiliation_strings":["Computer Science, Stony Brook University, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science, Stony Brook University, United States","institution_ids":["https://openalex.org/I59553526"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015711811","display_name":"R. Michael Winters","orcid":"https://orcid.org/0000-0002-8874-9184"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"R. Michael Winters","raw_affiliation_strings":["Microsoft Research Labs, Microsoft Corporation, United States"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Labs, Microsoft Corporation, United States","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022706370","display_name":"Thomas M. Gable","orcid":"https://orcid.org/0000-0002-3033-3565"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas Gable","raw_affiliation_strings":["Microsoft Corporation, United States"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, United States","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034708041","display_name":"Yu-Te Wang","orcid":"https://orcid.org/0000-0001-5576-5236"},"institutions":[{"id":"https://openalex.org/I84653119","display_name":"Academia Sinica","ror":"https://ror.org/05bxb3784","country_code":"TW","type":"facility","lineage":["https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yu Te Wang","raw_affiliation_strings":["Academia Sinica, Taiwan"],"affiliations":[{"raw_affiliation_string":"Academia Sinica, Taiwan","institution_ids":["https://openalex.org/I84653119"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114465164","display_name":"Teresa LaScala","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Teresa LaScala","raw_affiliation_strings":["Microsoft Research Labs, Microsoft Corporation, United States"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Labs, Microsoft Corporation, United States","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007425970","display_name":"Ivan Tashev","orcid":"https://orcid.org/0000-0002-2263-2047"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ivan J. Tashev","raw_affiliation_strings":["Microsoft Research Labs, Microsoft Corporation, United States"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Labs, Microsoft Corporation, United States","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5075120384"],"corresponding_institution_ids":["https://openalex.org/I59553526"],"apc_list":null,"apc_paid":null,"fwci":3.8224,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.94435022,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"214","last_page":"223"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.698999285697937},{"id":"https://openalex.org/keywords/wearable-computer","display_name":"Wearable computer","score":0.6805293560028076},{"id":"https://openalex.org/keywords/head","display_name":"Head (geology)","score":0.5987874269485474},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5693652033805847},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.13784927129745483}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.698999285697937},{"id":"https://openalex.org/C150594956","wikidata":"https://www.wikidata.org/wiki/Q1334829","display_name":"Wearable computer","level":2,"score":0.6805293560028076},{"id":"https://openalex.org/C2780312720","wikidata":"https://www.wikidata.org/wiki/Q5689100","display_name":"Head (geology)","level":2,"score":0.5987874269485474},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5693652033805847},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.13784927129745483},{"id":"https://openalex.org/C114793014","wikidata":"https://www.wikidata.org/wiki/Q52109","display_name":"Geomorphology","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3678957.3685720","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3678957.3685720","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conference on Multimodel Interaction","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5299999713897705,"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W157162768","https://openalex.org/W1969139822","https://openalex.org/W1986057074","https://openalex.org/W1995735739","https://openalex.org/W2008517591","https://openalex.org/W2044169976","https://openalex.org/W2049576927","https://openalex.org/W2057959448","https://openalex.org/W2073538956","https://openalex.org/W2098368939","https://openalex.org/W2110288969","https://openalex.org/W2125666044","https://openalex.org/W2138527036","https://openalex.org/W2144855640","https://openalex.org/W2151047074","https://openalex.org/W2158100192","https://openalex.org/W2334809025","https://openalex.org/W2344757691","https://openalex.org/W2483158495","https://openalex.org/W2490737928","https://openalex.org/W2586794626","https://openalex.org/W2764166175","https://openalex.org/W2770785043","https://openalex.org/W2790849987","https://openalex.org/W2793257307","https://openalex.org/W2806172474","https://openalex.org/W2809447336","https://openalex.org/W2853586540","https://openalex.org/W2889257687","https://openalex.org/W2897318954","https://openalex.org/W2898272312","https://openalex.org/W2919905642","https://openalex.org/W2921295135","https://openalex.org/W2941048526","https://openalex.org/W3004196347","https://openalex.org/W3083703874","https://openalex.org/W3089228032","https://openalex.org/W3091762102","https://openalex.org/W3094989392","https://openalex.org/W3113878582","https://openalex.org/W3130809619","https://openalex.org/W3153828612","https://openalex.org/W3160833628","https://openalex.org/W3163934237","https://openalex.org/W3179013167","https://openalex.org/W3182888500","https://openalex.org/W3213319487","https://openalex.org/W4200186631","https://openalex.org/W4205275033","https://openalex.org/W4210767182","https://openalex.org/W4225124540","https://openalex.org/W4239737559","https://openalex.org/W4242177601","https://openalex.org/W4249938195","https://openalex.org/W4294891788","https://openalex.org/W4313048962","https://openalex.org/W4366547682","https://openalex.org/W4387321423","https://openalex.org/W4387421591"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Silent":[0],"speech":[1,42,91,130,154,168,200,233],"recognition":[2,43],"has":[3],"emerged":[4],"as":[5,214],"a":[6,24,95],"promising":[7],"approach":[8],"for":[9,177,206,235],"enabling":[10],"hands-free":[11],"and":[12,33,62,72,76,85,101,119,126,140,167,173,208,217],"discreet":[13,209],"interaction":[14,210,234],"with":[15,89,98,106,153,183,211],"head-worn":[16,195],"devices.":[17,46],"In":[18],"this":[19],"paper,":[20],"we":[21],"present":[22],"QuietSync,":[23],"multimodal":[25],"system":[26,112,160,229],"that":[27,158],"combines":[28],"inertial":[29],"measurement":[30],"unit":[31],"(IMU)":[32],"contact":[34],"electrode":[35],"(ExG)":[36],"signals":[37,121],"to":[38,52,81,122,197,230],"achieve":[39],"accurate":[40],"silent":[41,90,129,199,232],"using":[44,193],"off-the-shelf":[45,194],"QuietSync":[47,225],"utilizes":[48],"an":[49,107],"IMU":[50,118,133],"attached":[51],"the":[53,57,60,68,74,114,124,138,144,165,171,190,220,227],"lower":[54],"part":[55],"of":[56,109,117,128,137,170,179,192,222],"headphones":[58],"near":[59],"ear":[61],"strategically":[63],"places":[64],"ExG":[65,120,145],"electrodes":[66,146],"on":[67],"headphones,":[69],"glasses":[70],"(nose":[71],"behind":[73],"ear),":[75],"face":[77],"(for":[78],"VR":[79],"applications)":[80],"capture":[82],"subtle":[83,135],"movements":[84,136],"muscle":[86,150],"activity":[87,151],"associated":[88,152],"production.":[92,155],"We":[93,156],"conducted":[94],"user":[96],"study":[97],"9":[99],"participants":[100],"successfully":[102],"recognized":[103],"12":[104],"commands":[105],"accuracy":[108],"94.2%.":[110],"Our":[111,187],"leverages":[113],"complementary":[115],"nature":[116],"enhance":[123],"robustness":[125],"reliability":[127],"recognition.":[131],"The":[132],"captures":[134],"jaw":[139],"facial":[141],"muscles,":[142],"while":[143],"detect":[147],"low-amplitude":[148],"surface":[149],"show":[157],"our":[159,223],"is":[161,226],"not":[162],"affected":[163],"by":[164],"length":[166],"mannerisms":[169],"commands,":[172],"can":[174],"be":[175],"fine-tuned":[176],"users":[178],"varied":[180],"native":[181],"languages":[182],"only":[184],"5":[185],"samples.":[186],"findings":[188],"demonstrate":[189],"feasibility":[191],"devices":[196,212],"enable":[198,231],"recognition,":[201],"opening":[202],"up":[203],"new":[204],"possibilities":[205],"seamless":[207],"such":[213],"VR/AR":[215],"headsets":[216],"earables.":[218],"To":[219],"best":[221],"knowledge,":[224],"first":[228],"multiple":[236],"form":[237],"factors.":[238]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":3}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
