{"id":"https://openalex.org/W4408147558","doi":"https://doi.org/10.1145/3712288","title":"WearSE: Enabling Streaming Speech Enhancement on Eyewear Using Acoustic Sensing","display_name":"WearSE: Enabling Streaming Speech Enhancement on Eyewear Using Acoustic Sensing","publication_year":2025,"publication_date":"2025-03-03","ids":{"openalex":"https://openalex.org/W4408147558","doi":"https://doi.org/10.1145/3712288"},"language":"en","primary_location":{"id":"doi:10.1145/3712288","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712288","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3712288","source":{"id":"https://openalex.org/S4210219751","display_name":"Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies","issn_l":"2474-9567","issn":["2474-9567"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3712288","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100401577","display_name":"Qian Zhang","orcid":"https://orcid.org/0000-0001-7708-8694"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qian Zhang","raw_affiliation_strings":["Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033242925","display_name":"Kaiyi Guo","orcid":"https://orcid.org/0009-0004-5639-1837"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiyi Guo","raw_affiliation_strings":["Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yifei Yang","orcid":"https://orcid.org/0009-0004-0233-4394"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifei Yang","raw_affiliation_strings":["Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100391426","display_name":"Dong Wang","orcid":"https://orcid.org/0000-0001-8444-1636"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Wang","raw_affiliation_strings":["Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100401577"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":5.5457,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.95121826,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"9","issue":"1","first_page":"1","last_page":"30"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13289","display_name":"Infant Health and Development","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/3611","display_name":"Pharmacy"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/eyewear","display_name":"Eyewear","score":0.9329593181610107},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.583648145198822},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.4136647582054138},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.36097681522369385},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09440794587135315},{"id":"https://openalex.org/keywords/optics","display_name":"Optics","score":0.07840195298194885}],"concepts":[{"id":"https://openalex.org/C2780527195","wikidata":"https://www.wikidata.org/wiki/Q5422874","display_name":"Eyewear","level":2,"score":0.9329593181610107},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.583648145198822},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.4136647582054138},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.36097681522369385},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09440794587135315},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.07840195298194885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3712288","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712288","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3712288","source":{"id":"https://openalex.org/S4210219751","display_name":"Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies","issn_l":"2474-9567","issn":["2474-9567"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3712288","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712288","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3712288","source":{"id":"https://openalex.org/S4210219751","display_name":"Proceedings of the ACM on Interactive Mobile Wearable and Ubiquitous Technologies","issn_l":"2474-9567","issn":["2474-9567"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5043351475","display_name":null,"funder_award_id":"NSFC 62102245","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4408147558.pdf"},"referenced_works_count":66,"referenced_works":["https://openalex.org/W1545025361","https://openalex.org/W2013608223","https://openalex.org/W2034082908","https://openalex.org/W2044893557","https://openalex.org/W2048142341","https://openalex.org/W2069681747","https://openalex.org/W2100417866","https://openalex.org/W2149425615","https://openalex.org/W2159202424","https://openalex.org/W2291877678","https://openalex.org/W2399593873","https://openalex.org/W2405774341","https://openalex.org/W2769533150","https://openalex.org/W2783985400","https://openalex.org/W2912794432","https://openalex.org/W2912868098","https://openalex.org/W2913017407","https://openalex.org/W2952218014","https://openalex.org/W2962866211","https://openalex.org/W2963242190","https://openalex.org/W2964171275","https://openalex.org/W2977240732","https://openalex.org/W2998161426","https://openalex.org/W3010673682","https://openalex.org/W3011424113","https://openalex.org/W3108244215","https://openalex.org/W3113878582","https://openalex.org/W3140645045","https://openalex.org/W3142719664","https://openalex.org/W3144915432","https://openalex.org/W3175849636","https://openalex.org/W3182657421","https://openalex.org/W3201134189","https://openalex.org/W3213107273","https://openalex.org/W3217415709","https://openalex.org/W4200186631","https://openalex.org/W4205097557","https://openalex.org/W4236976245","https://openalex.org/W4283031696","https://openalex.org/W4285815056","https://openalex.org/W4289665794","https://openalex.org/W4294891920","https://openalex.org/W4294892047","https://openalex.org/W4302446929","https://openalex.org/W4317927921","https://openalex.org/W4317928033","https://openalex.org/W4319837309","https://openalex.org/W4322731291","https://openalex.org/W4360991426","https://openalex.org/W4366547682","https://openalex.org/W4367046449","https://openalex.org/W4367046620","https://openalex.org/W4380925562","https://openalex.org/W4380928279","https://openalex.org/W4387087441","https://openalex.org/W4387227775","https://openalex.org/W4392019525","https://openalex.org/W4392120932","https://openalex.org/W4392931031","https://openalex.org/W4393290239","https://openalex.org/W4396833213","https://openalex.org/W4396919231","https://openalex.org/W4396919354","https://openalex.org/W4396919631","https://openalex.org/W4402349786","https://openalex.org/W4402350869"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2133527807","https://openalex.org/W2294000795","https://openalex.org/W2972340384","https://openalex.org/W2972915848","https://openalex.org/W3014431668","https://openalex.org/W2895531758","https://openalex.org/W3016294780"],"abstract_inverted_index":{"Smart":[0],"eyewear":[1,46,194],"has":[2],"rapidly":[3],"evolved":[4],"in":[5,80,205],"recent":[6],"years,":[7],"yet":[8],"its":[9],"mobile":[10,81,132],"and":[11,38,42,70,112,169],"in-the-wild":[12],"characteristics":[13],"often":[14],"make":[15],"voice":[16],"interactions":[17],"on":[18,45,72,131,215],"such":[19],"devices":[20],"susceptible":[21],"to":[22,47,62,88,147],"external":[23],"interferences.":[24,98],"In":[25,175],"this":[26],"paper,":[27],"we":[28,83,100,141],"introduce":[29],"WearSE,":[30],"a":[31,85,102,119,143,153,166],"system":[32,168],"that":[33,107,197],"utilizes":[34],"acoustic":[35,93],"signals":[36],"emitted":[37],"received":[39],"by":[40],"speakers":[41],"microphones":[43],"mounted":[44],"perceive":[48],"facial":[49],"movements":[50],"during":[51],"speech,":[52],"achieving":[53],"multimodal":[54],"speech":[55,104,116,159,187],"enhancement.":[56],"WearSE":[57,172,198,212],"incorporates":[58],"three":[59],"key":[60],"designs":[61],"meet":[63],"the":[64,77,90,110,115,136],"high":[65],"demands":[66,124],"for":[67,161],"real-time":[68,129],"operation":[69,130],"robustness":[71],"smart":[73,193],"eyewear.":[74],"First,":[75],"considering":[76],"frequent":[78],"use":[79],"scenarios,":[82,177],"design":[84,142],"sensing-enhanced":[86],"network":[87,106,121,162],"amplify":[89],"capability":[91],"of":[92,114,138,156,211],"sensing,":[94],"eliminating":[95],"dynamic":[96],"multipath":[97],"Second,":[99],"develop":[101],"lightweight":[103],"enhancement":[105,188],"enhances":[108],"both":[109],"amplitude":[111],"phase":[113],"spectrum.":[117],"Through":[118],"casual":[120],"design,":[122],"computational":[123],"are":[125],"significantly":[126,199],"reduced,":[127],"ensuring":[128],"devices.":[133,207],"Third,":[134],"addressing":[135],"scarcity":[137],"paired":[139],"data,":[140],"memory-based":[144],"back-translation":[145],"mechanism":[146],"generate":[148],"pseudo-acoustic":[149],"sensing":[150],"data":[151,160],"using":[152],"large":[154],"amount":[155],"publicly":[157],"available":[158,214],"training.":[163],"We":[164],"construct":[165],"prototype":[167],"extensively":[170],"evaluate":[171],"through":[173],"experiments.":[174],"multi-speaker":[176],"our":[178],"approach":[179],"exhibits":[180],"much":[181],"better":[182],"performance":[183],"than":[184],"pure":[185],"audio":[186,209],"methods.":[189],"Comparisons":[190],"with":[191],"commercial":[192],"also":[195],"demonstrate":[196],"surpasses":[200],"existing":[201],"noise":[202],"reduction":[203],"algorithms":[204],"these":[206],"The":[208],"demo":[210],"is":[213],"https://github.com/WearSE/wearse.github.io.":[216]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
