{"id":"https://openalex.org/W2740489634","doi":"https://doi.org/10.1109/taslp.2017.2732162","title":"Deep Feature Engineering for Noise Robust Spoofing Detection","display_name":"Deep Feature Engineering for Noise Robust Spoofing Detection","publication_year":2017,"publication_date":"2017-07-26","ids":{"openalex":"https://openalex.org/W2740489634","doi":"https://doi.org/10.1109/taslp.2017.2732162","mag":"2740489634"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2017.2732162","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2017.2732162","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100341993","display_name":"Yanmin Qian","orcid":"https://orcid.org/0000-0002-0314-3790"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanmin Qian","raw_affiliation_strings":["Computer Science and Engineering Department, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Department, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071702566","display_name":"Nanxin Chen","orcid":"https://orcid.org/0000-0001-6698-1604"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nanxin Chen","raw_affiliation_strings":["Center for Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA"],"affiliations":[{"raw_affiliation_string":"Center for Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080154283","display_name":"Heinrich Dinkel","orcid":"https://orcid.org/0000-0003-4330-8980"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heinrich Dinkel","raw_affiliation_strings":["Computer Science and Engineering Department, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering Department, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102765381","display_name":"Zhizheng Wu","orcid":"https://orcid.org/0009-0001-1192-9857"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhizheng Wu","raw_affiliation_strings":["Centre for Speech Technology Research, University of Edinburgh, Cupertino, CA, USA"],"affiliations":[{"raw_affiliation_string":"Centre for Speech Technology Research, University of Edinburgh, Cupertino, CA, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100341993"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":3.1385,"has_fulltext":false,"cited_by_count":44,"citation_normalized_percentile":{"value":0.93424752,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"25","issue":"10","first_page":"1942","last_page":"1955"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.960099995136261,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.9056674838066101},{"id":"https://openalex.org/keywords/spoofing-attack","display_name":"Spoofing attack","score":0.8959808349609375},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8100656270980835},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7944561243057251},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6861558556556702},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.6653389930725098},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6543025970458984},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6112675666809082},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5968836545944214},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5955543518066406},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.563231348991394},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47334885597229004},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.47282135486602783},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4223010540008545},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38699308037757874},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.08081504702568054}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.9056674838066101},{"id":"https://openalex.org/C167900197","wikidata":"https://www.wikidata.org/wiki/Q11081100","display_name":"Spoofing attack","level":2,"score":0.8959808349609375},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8100656270980835},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7944561243057251},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6861558556556702},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.6653389930725098},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6543025970458984},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6112675666809082},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5968836545944214},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5955543518066406},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.563231348991394},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47334885597229004},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.47282135486602783},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4223010540008545},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38699308037757874},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.08081504702568054},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2017.2732162","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2017.2732162","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7200000286102295,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G2368558818","display_name":null,"funder_award_id":"61603252","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5039175848","display_name":null,"funder_award_id":"61573241","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":79,"referenced_works":["https://openalex.org/W11511395","https://openalex.org/W129770839","https://openalex.org/W1006777433","https://openalex.org/W1490120479","https://openalex.org/W1522301498","https://openalex.org/W1566256432","https://openalex.org/W1904365287","https://openalex.org/W1974387177","https://openalex.org/W1979482308","https://openalex.org/W1992475611","https://openalex.org/W2012897754","https://openalex.org/W2028706510","https://openalex.org/W2033310064","https://openalex.org/W2046056978","https://openalex.org/W2053019885","https://openalex.org/W2062164080","https://openalex.org/W2062703747","https://openalex.org/W2079735306","https://openalex.org/W2089917322","https://openalex.org/W2114376863","https://openalex.org/W2121061347","https://openalex.org/W2121415728","https://openalex.org/W2123299109","https://openalex.org/W2127982613","https://openalex.org/W2129379984","https://openalex.org/W2131734706","https://openalex.org/W2136439176","https://openalex.org/W2138878452","https://openalex.org/W2150769028","https://openalex.org/W2150962366","https://openalex.org/W2151484683","https://openalex.org/W2160815625","https://openalex.org/W2163922914","https://openalex.org/W2170088868","https://openalex.org/W2176804518","https://openalex.org/W2198724430","https://openalex.org/W2213952365","https://openalex.org/W2270140468","https://openalex.org/W2297648422","https://openalex.org/W2303197844","https://openalex.org/W2394932179","https://openalex.org/W2397947827","https://openalex.org/W2398362606","https://openalex.org/W2398758564","https://openalex.org/W2401315748","https://openalex.org/W2401657728","https://openalex.org/W2401839215","https://openalex.org/W2402195372","https://openalex.org/W2402922286","https://openalex.org/W2405506115","https://openalex.org/W2405524873","https://openalex.org/W2406264770","https://openalex.org/W2406778302","https://openalex.org/W2407170210","https://openalex.org/W2483721152","https://openalex.org/W2491899193","https://openalex.org/W2512302098","https://openalex.org/W2515753980","https://openalex.org/W2533075636","https://openalex.org/W2548055032","https://openalex.org/W2576165910","https://openalex.org/W2587717635","https://openalex.org/W6600449757","https://openalex.org/W6605272181","https://openalex.org/W6631190155","https://openalex.org/W6640036494","https://openalex.org/W6685748340","https://openalex.org/W6688428952","https://openalex.org/W6693961328","https://openalex.org/W6711962127","https://openalex.org/W6712660717","https://openalex.org/W6712816420","https://openalex.org/W6712883666","https://openalex.org/W6713214774","https://openalex.org/W6713361921","https://openalex.org/W6713401928","https://openalex.org/W6713566751","https://openalex.org/W6713679595","https://openalex.org/W6729633544"],"related_works":["https://openalex.org/W4298017035","https://openalex.org/W3128220493","https://openalex.org/W2792147139","https://openalex.org/W3110700750","https://openalex.org/W2998675825","https://openalex.org/W4226354336","https://openalex.org/W4394636190","https://openalex.org/W2736804899","https://openalex.org/W2897443685","https://openalex.org/W4307654087"],"abstract_inverted_index":{"Spoofing":[0],"detection":[1,36],"for":[2,74,135,181],"automatic":[3],"speaker":[4],"verification":[5],"(ASV)":[6],"aims":[7],"to":[8,23,62,88,103,112,115,177],"discriminate":[9],"between":[10],"genuine":[11],"and":[12,65,84,99,111,119,126,157,175,179,183],"spoofed":[13],"speech.":[14],"This":[15],"topic":[16],"has":[17,37],"received":[18],"increased":[19],"attentions":[20],"recently":[21],"due":[22],"safety":[24],"concerns":[25],"with":[26],"deploying":[27],"an":[28],"ASV":[29],"system.":[30],"While":[31],"the":[32,46,148,164],"performance":[33,47],"of":[34,147],"spoofing":[35,75,117,136],"improved":[38],"significantly":[39],"in":[40,43,50,57],"clean":[41],"condition":[42],"recent":[44],"studies,":[45],"degrades":[48],"dramatically":[49,167],"noisy":[51,145,156,185],"conditions.":[52],"To":[53],"address":[54],"this":[55,58],"issue,":[56],"paper,":[59],"we":[60,79],"propose":[61],"extract":[63,89],"robust":[64,108],"discriminative":[66,90],"deep":[67,71,81],"features":[68],"by":[69],"using":[70],"learning":[72],"techniques":[73,128],"detection.":[76,137],"In":[77],"particular,":[78],"employ":[80],"feedforward,":[82],"recurrent,":[83],"convolutional":[85],"neural":[86,105,124],"networks":[87,106,125],"features.":[91],"We":[92],"also":[93],"introduce":[94],"multicondition":[95],"training,":[96,98],"noise-aware":[97],"annealed":[100],"dropout":[101],"training":[102,127],"make":[104],"more":[107],"against":[109],"noise":[110,120],"avoid":[113],"overfitting":[114],"specific":[116],"attacks":[118],"types.":[121],"The":[122],"proposed":[123,165],"are":[129],"combined":[130],"into":[131],"a":[132,144],"single":[133],"framework":[134],"Experimental":[138,160],"evaluation":[139],"is":[140],"carried":[141],"out":[142],"on":[143],"version":[146],"standard":[149],"ASVspoof":[150],"2015":[151],"corpus,":[152],"including":[153],"both":[154],"additive":[155],"reverberant":[158],"scenarios.":[159],"results":[161],"confirm":[162],"that":[163],"system":[166],"decreases":[168],"averaged":[169],"equal":[170],"error":[171],"rates":[172],"from":[173],"19.1%":[174],"22.6%":[176],"3.2%":[178],"5.1%":[180],"seen":[182],"unseen":[184],"conditions,":[186],"respectively.":[187]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":1}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
