{"id":"https://openalex.org/W4403362836","doi":"https://doi.org/10.1109/icassp49660.2025.10890611","title":"Detecting and Defending Against Adversarial Attacks on Automatic Speech Recognition via Diffusion Models","display_name":"Detecting and Defending Against Adversarial Attacks on Automatic Speech Recognition via Diffusion Models","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4403362836","doi":"https://doi.org/10.1109/icassp49660.2025.10890611"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890611","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890611","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2409.07936","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111396335","display_name":"Nikolai Lund K\u00fchne","orcid":null},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Nikolai L. K\u00fchne","raw_affiliation_strings":["Aalborg University,Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116580508","display_name":"Astrid H. F. Kitchena","orcid":null},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Astrid H. F. Kitchena","raw_affiliation_strings":["Aalborg University,Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Marie S. Jensen","orcid":null},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Marie S. Jensen","raw_affiliation_strings":["Aalborg University,Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111396336","display_name":"Mikkel Sebastian Lundsgaard Br\u00f8ndt","orcid":null},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Mikkel S. L. Br\u00f8ndt","raw_affiliation_strings":["Aalborg University,Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101788847","display_name":"Martin Gonzalez","orcid":"https://orcid.org/0000-0002-1176-2022"},"institutions":[{"id":"https://openalex.org/I3018083178","display_name":"Institut de Recherche Technologique SystemX","ror":"https://ror.org/03crmsn52","country_code":"FR","type":"facility","lineage":["https://openalex.org/I3018083178"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Martin Gonzalez","raw_affiliation_strings":["IRT SystemX,France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IRT SystemX,France","institution_ids":["https://openalex.org/I3018083178"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107409832","display_name":"Christophe A. N. Biscio","orcid":"https://orcid.org/0000-0002-2218-6825"},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Christophe Biscio","raw_affiliation_strings":["Aalborg University,Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110112480","display_name":"Zheng-Hua Tan","orcid":"https://orcid.org/0000-0002-6855-6852"},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Zheng-Hua Tan","raw_affiliation_strings":["Aalborg University,Denmark"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aalborg University,Denmark","institution_ids":["https://openalex.org/I891191580"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5111396335"],"corresponding_institution_ids":["https://openalex.org/I891191580"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00055772,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9772999882698059,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9772999882698059,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9684000015258789,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9631999731063843,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.9321211576461792},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8457820415496826},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5930798053741455},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5389353632926941},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49436450004577637},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.41145631670951843},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3268616497516632}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.9321211576461792},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8457820415496826},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5930798053741455},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5389353632926941},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49436450004577637},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.41145631670951843},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3268616497516632},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890611","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890611","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2409.07936","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.07936","pdf_url":"https://arxiv.org/pdf/2409.07936","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:HAL:hal-04726719v1","is_oa":true,"landing_page_url":"https://hal.science/hal-04726719","pdf_url":"https://hal.science/hal-04726719v1/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), Apr 2025, Hyderabad, India","raw_type":"Conference papers"},{"id":"pmh:oai:pure.atira.dk:publications/56da4472-334e-4c2f-a785-1f3599d111e6","is_oa":true,"landing_page_url":"https://vbn.aau.dk/da/publications/56da4472-334e-4c2f-a785-1f3599d111e6","pdf_url":"https://vbn.aau.dk/ws/files/762629688/2025001486.pdf","source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"K\u00fchne, N L, Kitchen, A H F, Saugstrup Jensen, M, Br\u00f8ndt, M S L, Gonzalez, M, Biscio, C & Tan, Z-H 2025, Detecting and Defending Against Adversarial Attacks on Automatic Speech Recognition via Diffusion Models. in 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE (Institute of Electrical and Electronics Engineers), 2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, Hyderabad, India, 06/04/2025. https://doi.org/10.1109/ICASSP49660.2025.10890611","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"doi:10.48550/arxiv.2409.07936","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2409.07936","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2409.07936","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.07936","pdf_url":"https://arxiv.org/pdf/2409.07936","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4403362836.pdf"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W2127141656","https://openalex.org/W2180612164","https://openalex.org/W2194775991","https://openalex.org/W2525632221","https://openalex.org/W2906211136","https://openalex.org/W2954930777","https://openalex.org/W2963857521","https://openalex.org/W2964082701","https://openalex.org/W2964301649","https://openalex.org/W2973252307","https://openalex.org/W3015241525","https://openalex.org/W3091896612","https://openalex.org/W3153453329","https://openalex.org/W3156272176","https://openalex.org/W4311424365","https://openalex.org/W4312458120","https://openalex.org/W4328007740","https://openalex.org/W6637162671","https://openalex.org/W6640090968","https://openalex.org/W6640425456","https://openalex.org/W6640963894","https://openalex.org/W6679045638","https://openalex.org/W6739868092","https://openalex.org/W6746295503","https://openalex.org/W6748288002","https://openalex.org/W6754602573","https://openalex.org/W6760326341","https://openalex.org/W6771467084","https://openalex.org/W6779823529","https://openalex.org/W6783182287","https://openalex.org/W6788990321","https://openalex.org/W6791552382","https://openalex.org/W6850532857"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W4246396837","https://openalex.org/W3126451824","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W4310988119","https://openalex.org/W4285226279","https://openalex.org/W4288019534"],"abstract_inverted_index":{"Automatic":[0],"speech":[1,24],"recognition":[2],"(ASR)":[3],"systems":[4],"are":[5],"known":[6],"to":[7,10,37],"be":[8],"vulnerable":[9],"adversarial":[11,39,89,122,135,151],"attacks.":[12],"This":[13],"paper":[14],"addresses":[15],"detection":[16],"and":[17,93],"defence":[18],"against":[19,88,121],"targeted":[20],"white-box":[21],"attacks":[22,90,123,136,152],"on":[23,70,91,105,124],"signals":[25],"for":[26,50,86,133],"ASR":[27,57],"systems.":[28],"While":[29],"existing":[30],"work":[31],"has":[32],"utilised":[33],"diffusion":[34,68,100,116],"models":[35],"(DMs)":[36],"purify":[38],"examples,":[40],"achieving":[41],"state-of-the-art":[42],"results":[43,144],"in":[44],"keyword":[45],"spotting":[46],"tasks,":[47],"their":[48],"effectiveness":[49],"more":[51],"complex":[52],"tasks":[53],"such":[54],"as":[55],"sentence-level":[56],"remains":[58],"unexplored.":[59],"Additionally,":[60],"the":[61,64,82,95,106],"impact":[62],"of":[63,66,84,97],"number":[65],"forward":[67,99,115],"steps":[69,117],"performance":[71],"is":[72],"not":[73],"well":[74],"understood.":[75],"In":[76],"this":[77,147],"paper,":[78],"we":[79,111,127],"systematically":[80],"investigate":[81],"use":[83],"DMs":[85],"defending":[87],"sentences":[92],"examine":[94],"effect":[96],"varying":[98],"steps.":[101],"Through":[102],"comprehensive":[103],"experiments":[104],"Mozilla":[107],"Common":[108],"Voice":[109],"dataset,":[110],"demonstrate":[112],"that":[113,146],"two":[114],"can":[118,149],"completely":[119],"defend":[120],"sentences.":[125],"Moreover,":[126],"introduce":[128],"a":[129,139],"novel,":[130],"training-free":[131],"approach":[132],"detecting":[134],"by":[137],"leveraging":[138],"pre-trained":[140],"DM.":[141],"Our":[142],"experimental":[143],"show":[145],"method":[148],"detect":[150],"with":[153],"high":[154],"accuracy.":[155]},"counts_by_year":[],"updated_date":"2026-05-15T08:27:34.491423","created_date":"2024-10-13T00:00:00"}
