{"id":"https://openalex.org/W4388116228","doi":"https://doi.org/10.1109/isi58743.2023.10297267","title":"Learning to Listen and Listening to Learn: Spoofed Audio Detection Through Linguistic Data Augmentation","display_name":"Learning to Listen and Listening to Learn: Spoofed Audio Detection Through Linguistic Data Augmentation","publication_year":2023,"publication_date":"2023-10-02","ids":{"openalex":"https://openalex.org/W4388116228","doi":"https://doi.org/10.1109/isi58743.2023.10297267"},"language":"en","primary_location":{"id":"doi:10.1109/isi58743.2023.10297267","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isi58743.2023.10297267","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Intelligence and Security Informatics (ISI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025228118","display_name":"Zahra Khanjani","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zahra Khanjani","raw_affiliation_strings":["University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111878160","display_name":"L.S. Davis","orcid":"https://orcid.org/0009-0001-1414-8415"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lavon Davis","raw_affiliation_strings":["University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003143459","display_name":"Anna Tuz","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anna Tuz","raw_affiliation_strings":["University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Kifekachukwu Nwosu","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kifekachukwu Nwosu","raw_affiliation_strings":["University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047324018","display_name":"Christine Mallinson","orcid":"https://orcid.org/0000-0002-8988-5399"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christine Mallinson","raw_affiliation_strings":["University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063541070","display_name":"Vandana P. Janeja","orcid":"https://orcid.org/0000-0003-0130-6135"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vandana P. Janeja","raw_affiliation_strings":["University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5025228118"],"corresponding_institution_ids":["https://openalex.org/I66946132"],"apc_list":null,"apc_paid":null,"fwci":0.7087,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.76729145,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"01","last_page":"06"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9807000160217285,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spoofing-attack","display_name":"Spoofing attack","score":0.8684401512145996},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7778153419494629},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5393616557121277},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.5152526497840881},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46398189663887024},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3573419153690338},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.23605570197105408},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.21166002750396729},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.11055117845535278}],"concepts":[{"id":"https://openalex.org/C167900197","wikidata":"https://www.wikidata.org/wiki/Q11081100","display_name":"Spoofing attack","level":2,"score":0.8684401512145996},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7778153419494629},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5393616557121277},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.5152526497840881},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46398189663887024},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3573419153690338},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.23605570197105408},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.21166002750396729},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.11055117845535278}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isi58743.2023.10297267","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isi58743.2023.10297267","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Intelligence and Security Informatics (ISI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6700000166893005,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G5864374203","display_name":null,"funder_award_id":"2210011","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2176804518","https://openalex.org/W2295634712","https://openalex.org/W2497227373","https://openalex.org/W2519091744","https://openalex.org/W2588445447","https://openalex.org/W2747872086","https://openalex.org/W2911227954","https://openalex.org/W2955054437","https://openalex.org/W2972811785","https://openalex.org/W2989571531","https://openalex.org/W3024920698","https://openalex.org/W3026777299","https://openalex.org/W3093077017","https://openalex.org/W3144417991","https://openalex.org/W3197358873","https://openalex.org/W3198329097","https://openalex.org/W3213515747","https://openalex.org/W4225420087","https://openalex.org/W4226246616","https://openalex.org/W4236097868","https://openalex.org/W4313984387","https://openalex.org/W6799089041","https://openalex.org/W6804283585","https://openalex.org/W6849117450"],"related_works":["https://openalex.org/W2998478967","https://openalex.org/W2188559950","https://openalex.org/W2989910292","https://openalex.org/W3128793638","https://openalex.org/W2607818178","https://openalex.org/W2123299109","https://openalex.org/W2021230337","https://openalex.org/W3153057489","https://openalex.org/W2895823926","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Spoofed":[0],"audio,":[1],"both":[2,107,158],"human":[3,189],"or":[4],"machine":[5],"generated,":[6],"causes":[7],"deception":[8],"and":[9,11,54,72,113,125,161,168],"disinformation":[10],"as":[12,185],"such":[13],"is":[14],"a":[15,27,64,186,203],"societal":[16],"challenge.":[17],"This":[18],"study":[19],"advances":[20],"the":[21,60,109,114,121,142,150,159,165,174],"detection":[22,94,155],"of":[23,63,66,134,152,177,188],"spoofed":[24,92,122,135,153,196,215],"audio":[25,34,45,52,93,110,123,136,143,154,179,197,211,216],"through":[26],"novel":[28],"approach":[29],"that":[30,75,140],"augments":[31],"knowledge":[32],"about":[33],"data":[35,111,144,180],"by":[36],"incorporating":[37],"linguistic":[38,147,183,207],"information.":[39],"Using":[40],"perceptual":[41,182],"methods,":[42],"for":[43,51,195,205,213],"English":[44],"samples,":[46,68],"experts":[47],"in":[48,78,90,157],"sociolinguistics":[49],"listened":[50],"cues,":[53],"used":[55,89],"binary":[56],"labels":[57],"to":[58,96,119,126,191],"indicate":[59,173],"perceived":[61],"authenticity":[62],"set":[65],"speech":[67],"based":[69,103],"on":[70,104,209],"phonetic":[71],"phonological":[73],"features":[74,106,200],"occur":[76],"frequently":[77],"spoken":[79],"English.":[80],"These":[81,199],"Expert":[82],"Defined":[83],"Linguistic":[84],"Features":[85],"(EDLFs)":[86],"were":[87],"then":[88],"supervised":[91],"methods":[95,133],"augment":[97],"AI":[98],"models.":[99,170],"An":[100],"ensemble":[101,169],"method":[102,187],"multi-domain":[105],"from":[108],"itself":[112],"EDLFs":[115,129],"was":[116],"also":[117,201],"created":[118],"evaluate":[120],"detection,":[124],"demonstrate":[127],"how":[128],"can":[130],"improve":[131],"traditional":[132],"detection.":[137,198,217],"We":[138],"found":[139],"augmenting":[141,178],"with":[145,181],"expertinformed":[146],"annotation":[148],"increased":[149],"accuracy":[151],"significantly":[156],"training":[160],"testing":[162],"datasets":[163],"across":[164],"evaluated":[166],"single":[167],"Our":[171],"findings":[172],"promising":[175],"avenue":[176],"techniques,":[184],"discernment,":[190],"enhance":[192],"AI-based":[193],"approaches":[194],"establish":[202],"foundation":[204],"direct":[206],"annotations":[208],"new":[210],"clips":[212],"robust":[214]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2025-10-10T00:00:00"}
