{"id":"https://openalex.org/W4392411893","doi":"https://doi.org/10.1109/ijcb57857.2023.10449121","title":"SV-DeiT: Speaker Verification with DeiTCap Spoofing Detection","display_name":"SV-DeiT: Speaker Verification with DeiTCap Spoofing Detection","publication_year":2023,"publication_date":"2023-09-25","ids":{"openalex":"https://openalex.org/W4392411893","doi":"https://doi.org/10.1109/ijcb57857.2023.10449121"},"language":"en","primary_location":{"id":"doi:10.1109/ijcb57857.2023.10449121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcb57857.2023.10449121","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Joint Conference on Biometrics (IJCB)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110852852","display_name":"Rishabh Ranjan","orcid":null},"institutions":[{"id":"https://openalex.org/I154549908","display_name":"Indian Institute of Technology Jodhpur","ror":"https://ror.org/03yacj906","country_code":"IN","type":"education","lineage":["https://openalex.org/I154549908"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Rishabh Ranjan","raw_affiliation_strings":["Indian Institute of Technology, Jodhpur,Jodhpur,India","Indian Institute of Technology, Jodhpur, Jodhpur, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Jodhpur,Jodhpur,India","institution_ids":["https://openalex.org/I154549908"]},{"raw_affiliation_string":"Indian Institute of Technology, Jodhpur, Jodhpur, India","institution_ids":["https://openalex.org/I154549908"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050521702","display_name":"Mayank Vatsa","orcid":"https://orcid.org/0000-0001-5952-2274"},"institutions":[{"id":"https://openalex.org/I154549908","display_name":"Indian Institute of Technology Jodhpur","ror":"https://ror.org/03yacj906","country_code":"IN","type":"education","lineage":["https://openalex.org/I154549908"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Mayank Vatsa","raw_affiliation_strings":["Indian Institute of Technology, Jodhpur,Jodhpur,India","Indian Institute of Technology, Jodhpur, Jodhpur, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Jodhpur,Jodhpur,India","institution_ids":["https://openalex.org/I154549908"]},{"raw_affiliation_string":"Indian Institute of Technology, Jodhpur, Jodhpur, India","institution_ids":["https://openalex.org/I154549908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011779957","display_name":"Richa Singh","orcid":"https://orcid.org/0000-0003-4060-4573"},"institutions":[{"id":"https://openalex.org/I154549908","display_name":"Indian Institute of Technology Jodhpur","ror":"https://ror.org/03yacj906","country_code":"IN","type":"education","lineage":["https://openalex.org/I154549908"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Richa Singh","raw_affiliation_strings":["Indian Institute of Technology, Jodhpur,Jodhpur,India","Indian Institute of Technology, Jodhpur, Jodhpur, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Jodhpur,Jodhpur,India","institution_ids":["https://openalex.org/I154549908"]},{"raw_affiliation_string":"Indian Institute of Technology, Jodhpur, Jodhpur, India","institution_ids":["https://openalex.org/I154549908"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110852852"],"corresponding_institution_ids":["https://openalex.org/I154549908"],"apc_list":null,"apc_paid":null,"fwci":0.3491,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.6822307,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.8083373308181763},{"id":"https://openalex.org/keywords/spoofing-attack","display_name":"Spoofing attack","score":0.7570198774337769},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7342058420181274},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.49639326333999634},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.41452130675315857},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.21385008096694946}],"concepts":[{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.8083373308181763},{"id":"https://openalex.org/C167900197","wikidata":"https://www.wikidata.org/wiki/Q11081100","display_name":"Spoofing attack","level":2,"score":0.7570198774337769},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7342058420181274},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.49639326333999634},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.41452130675315857},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.21385008096694946}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcb57857.2023.10449121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcb57857.2023.10449121","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Joint Conference on Biometrics (IJCB)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1638038541","https://openalex.org/W2108598243","https://openalex.org/W2138878452","https://openalex.org/W2295634712","https://openalex.org/W2401839215","https://openalex.org/W2403139431","https://openalex.org/W2560674852","https://openalex.org/W2593116425","https://openalex.org/W2602814339","https://openalex.org/W2740489634","https://openalex.org/W2912083425","https://openalex.org/W2936802426","https://openalex.org/W2967606780","https://openalex.org/W2972786657","https://openalex.org/W2973181078","https://openalex.org/W2999174651","https://openalex.org/W3024920698","https://openalex.org/W3094502228","https://openalex.org/W3126967250","https://openalex.org/W3127781933","https://openalex.org/W3158663310","https://openalex.org/W3160325739","https://openalex.org/W3163596559","https://openalex.org/W3175036090","https://openalex.org/W3196974791","https://openalex.org/W3198329097","https://openalex.org/W3200167423","https://openalex.org/W3201773091","https://openalex.org/W3213618310","https://openalex.org/W4281847696","https://openalex.org/W4297841768","https://openalex.org/W4317181815","https://openalex.org/W4372260474","https://openalex.org/W4385763728","https://openalex.org/W6739901393","https://openalex.org/W6743446608","https://openalex.org/W6788135285","https://openalex.org/W6795261426","https://openalex.org/W6838910450"],"related_works":["https://openalex.org/W4294437891","https://openalex.org/W4226389478","https://openalex.org/W4297792928","https://openalex.org/W4221161333","https://openalex.org/W3113108043","https://openalex.org/W2061278248","https://openalex.org/W4298202768","https://openalex.org/W1914348842","https://openalex.org/W1516392727","https://openalex.org/W2140022733"],"abstract_inverted_index":{"As":[0],"advancements":[1],"in":[2,55,77,150],"automatic":[3],"speech":[4],"generation":[5],"continue":[6],"to":[7,11,27,86,120],"progress,":[8],"the":[9,48,61,78,98,122,136,140,145],"ability":[10],"distinguish":[12],"between":[13],"real":[14],"and":[15,32,52,81,117,160],"fake":[16],"samples":[17],"has":[18],"diminished.":[19],"In":[20],"addition,":[21],"current":[22],"spoofing":[23,99],"detection":[24,64,93],"algorithms":[25],"struggle":[26],"perform":[28],"well":[29],"on":[30,66,135],"new":[31],"unseen":[33],"test":[34],"distributions.":[35],"To":[36],"address":[37],"these":[38],"challenges,":[39],"this":[40],"paper":[41],"presents":[42],"two":[43,154],"contributions.":[44],"First,":[45],"inspired":[46],"by":[47],"success":[49],"of":[50,124,133,139],"transformer":[51],"capsule":[53,88],"networks":[54],"high":[56],"representation":[57],"capabilities,":[58],"we":[59,106],"propose":[60],"DeiTCap":[62],"spoof":[63,92],"network":[65,147],"spectrogram":[67],"audio":[68,79],"features.":[69],"This":[70],"framework":[71,103],"utilizes":[72],"multi-head":[73],"attention,":[74],"sub-entities":[75],"(capsules)":[76],"domain":[80],"a":[82,108],"modified":[83],"routing":[84],"algorithm":[85,94],"identify":[87],"agreement.":[89],"The":[90],"proposed":[91,128,146],"is":[95],"integrated":[96],"into":[97],"aware":[100],"speaker":[101],"recognition":[102],"SV-DeiT.":[104],"Second,":[105],"introduce":[107],"novel":[109],"text-to-speech":[110],"dataset":[111],"TRADIF":[112],"created":[113],"with":[114,153],"cutting-edge":[115],"transformers":[116],"diffusion":[118],"models":[119],"evaluate":[121],"generalizability":[123],"countermeasure":[125],"systems.":[126],"Our":[127],"DeiT-Cap":[129],"achieves":[130],"an":[131],"EER":[132],"1.08%":[134],"evaluation":[137],"set":[138],"ASVSpoof2019":[141],"LA":[142],"dataset.":[143],"Moreover,":[144],"demonstrates":[148],"strength":[149],"cross-domain":[151],"training-testing":[152],"different":[155],"datasets,":[156],"highlighting":[157],"its":[158],"robustness":[159],"versatility.":[161]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
