{"id":"https://openalex.org/W4281392593","doi":"https://doi.org/10.1145/3488932.3517420","title":"SUPERVOICE","display_name":"SUPERVOICE","publication_year":2022,"publication_date":"2022-05-24","ids":{"openalex":"https://openalex.org/W4281392593","doi":"https://doi.org/10.1145/3488932.3517420"},"language":"en","primary_location":{"id":"doi:10.1145/3488932.3517420","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3488932.3517420","pdf_url":null,"source":{"id":"https://openalex.org/S4363609011","display_name":"Proceedings of the 2022 ACM on Asia Conference on Computer and Communications Security","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 ACM on Asia Conference on Computer and Communications Security","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035545617","display_name":"Hanqing Guo","orcid":"https://orcid.org/0000-0003-3779-4679"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hanqing Guo","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042277127","display_name":"Qiben Yan","orcid":"https://orcid.org/0000-0001-6272-7668"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qiben Yan","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085356579","display_name":"Nikolay Ivanov","orcid":"https://orcid.org/0000-0002-2325-2847"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nikolay Ivanov","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041988267","display_name":"Ying Zhu","orcid":"https://orcid.org/0000-0002-5708-3252"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ying Zhu","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100630881","display_name":"Li Xiao","orcid":"https://orcid.org/0000-0003-2861-8438"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Li Xiao","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043923522","display_name":"Eric J. Hunter","orcid":"https://orcid.org/0000-0001-5571-464X"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eric J. Hunter","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5035545617"],"corresponding_institution_ids":["https://openalex.org/I87216513"],"apc_list":null,"apc_paid":null,"fwci":0.525,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.62078652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1019","last_page":"1033"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8573082685470581},{"id":"https://openalex.org/keywords/spoofing-attack","display_name":"Spoofing attack","score":0.826370358467102},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5686855316162109},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5591306686401367},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5455309152603149},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.5081872940063477},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.43882206082344055},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.42022591829299927},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.13261577486991882},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.11192536354064941}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8573082685470581},{"id":"https://openalex.org/C167900197","wikidata":"https://www.wikidata.org/wiki/Q11081100","display_name":"Spoofing attack","level":2,"score":0.826370358467102},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5686855316162109},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5591306686401367},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5455309152603149},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.5081872940063477},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.43882206082344055},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.42022591829299927},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.13261577486991882},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.11192536354064941},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3488932.3517420","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3488932.3517420","pdf_url":null,"source":{"id":"https://openalex.org/S4363609011","display_name":"Proceedings of the 2022 ACM on Asia Conference on Computer and Communications Security","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 ACM on Asia Conference on Computer and Communications Security","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7099999785423279,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G3652504997","display_name":null,"funder_award_id":"R01DC012315","funder_id":"https://openalex.org/F4320337352","funder_display_name":"National Institute on Deafness and Other Communication Disorders"},{"id":"https://openalex.org/G4242031410","display_name":null,"funder_award_id":"CNS-1950171; CCF-2007159","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337352","display_name":"National Institute on Deafness and Other Communication Disorders","ror":"https://ror.org/04mhx6838"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W84813673","https://openalex.org/W1542280630","https://openalex.org/W1558698732","https://openalex.org/W1635512741","https://openalex.org/W1849277567","https://openalex.org/W1984849881","https://openalex.org/W2000667994","https://openalex.org/W2002123483","https://openalex.org/W2062703747","https://openalex.org/W2064364374","https://openalex.org/W2097117768","https://openalex.org/W2111491793","https://openalex.org/W2114925438","https://openalex.org/W2123299109","https://openalex.org/W2133895428","https://openalex.org/W2147147599","https://openalex.org/W2150769028","https://openalex.org/W2169879729","https://openalex.org/W2187089797","https://openalex.org/W2194775991","https://openalex.org/W2398826216","https://openalex.org/W2472787443","https://openalex.org/W2536166232","https://openalex.org/W2575585029","https://openalex.org/W2624801495","https://openalex.org/W2745896134","https://openalex.org/W2747024632","https://openalex.org/W2748488820","https://openalex.org/W2765636281","https://openalex.org/W2809536883","https://openalex.org/W2888955371","https://openalex.org/W2962788625","https://openalex.org/W2964052309","https://openalex.org/W2974062151","https://openalex.org/W2981087920","https://openalex.org/W2984998244","https://openalex.org/W4300824008"],"related_works":["https://openalex.org/W1977167953","https://openalex.org/W2954943288","https://openalex.org/W107154053","https://openalex.org/W4255044973","https://openalex.org/W2499802997","https://openalex.org/W2112059504","https://openalex.org/W2727729836","https://openalex.org/W1960256358","https://openalex.org/W2464377622","https://openalex.org/W2394963835"],"abstract_inverted_index":{"Voice-activated":[0],"systems":[1,236],"are":[2,193],"integrated":[3],"into":[4],"a":[5,32,78,126,133,138,153,171],"variety":[6],"of":[7,31,60,81,90,121,159,233],"desktop,":[8],"mobile,":[9],"and":[10,21,119,187,207],"Internet-of-Things":[11],"(IoT)":[12],"devices.":[13],"However,":[14,63],"voice":[15,30,61,83,162,174],"spoofing":[16],"attacks,":[17,23],"such":[18],"as":[19],"impersonation":[20],"replay":[22,36,269],"in":[24,221,267,284],"which":[25,226],"malicious":[26],"attackers":[27],"synthesize":[28],"the":[29,51,87,94,102,117,149,190,222,228,234],"victim":[33],"or":[34],"simply":[35],"it,":[37],"have":[38,66],"brought":[39],"growing":[40],"security":[41,118],"concerns.":[42],"Existing":[43],"speaker":[44,122,127,145,223,252],"verification":[45,128,224,253],"techniques":[46],"distinguish":[47],"individual":[48],"speakers":[49],"via":[50],"spectrographic":[52],"features":[53],"extracted":[54],"from":[55,109,164,195],"an":[56,208,246,289],"audible":[57],"frequency":[58,96],"range":[59],"commands.":[62],"they":[64],"often":[65],"high":[67],"error":[68,219,231,265],"rates":[69],"and/or":[70],"long":[71],"delays.":[72],"In":[73,167,180],"this":[74],"paper,":[75],"we":[76,151,169,277],"explore":[77],"new":[79],"direction":[80],"human":[82,91],"research":[84,99],"by":[85,199,237,272,287],"scrutinizing":[86],"unique":[88],"characteristics":[89],"speech":[92,107,154],"at":[93],"ultrasound":[95,104,209,291],"band.":[97],"Our":[98,211],"indicates":[100],"that":[101,131,214,279],"high-frequency":[103],"components":[105],"(e.g.":[106],"fricatives)":[108],"20":[110],"to":[111,142,176,182],"48":[112],"kHz":[113],"can":[114,281],"significantly":[115],"enhance":[116],"accuracy":[120],"verification.":[123],"We":[124],"propose":[125],"system,":[129,150],"SUPERVOICE":[130,215,239,261,280],"uses":[132],"two-stream":[134],"DNN":[135],"architecture":[136],"with":[137,156],"feature":[139],"fusion":[140],"mechanism":[141],"generate":[143],"distinctive":[144],"models.":[146],"To":[147],"test":[148],"create":[152,170],"dataset":[155,175],"12":[157],"hours":[158],"audio":[160,191],"(8,950":[161],"samples)":[163],"127":[165],"participants.":[166],"addition,":[168],"second":[172],"spoofed":[173],"evaluate":[177],"its":[178],"security.":[179],"order":[181],"balance":[183],"between":[184],"controlled":[185],"recordings":[186,192],"real-world":[188],"applications,":[189],"collected":[194],"two":[196],"quiet":[197],"rooms":[198],"8":[200],"different":[201,274],"recording":[202],"devices,":[203],"including":[204],"7":[205],"smartphones":[206,286],"microphone.":[210,292],"evaluation":[212],"shows":[213],"achieves":[216,262],"0.58%":[217],"equal":[218,230,264],"rate":[220,232,266],"task,":[225],"reduces":[227],"best":[229],"existing":[235,251],"86.1%.":[238],"only":[240],"takes":[241],"120":[242],"ms":[243,258],"for":[244],"testing":[245],"incoming":[247],"utterance,":[248],"outperforming":[249],"all":[250],"systems.":[254],"Moreover,":[255],"within":[256],"91":[257],"processing":[259],"time,":[260],"0%":[263],"detecting":[268],"attacks":[270],"launched":[271],"5":[273],"loudspeakers.":[275],"Finally,":[276],"demonstrate":[278],"be":[282],"used":[283],"retail":[285],"integrating":[288],"off-the-shelf":[290]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2022-05-25T00:00:00"}
