{"id":"https://openalex.org/W4224932929","doi":"https://doi.org/10.1109/icassp43922.2022.9747605","title":"Fake Audio Detection Based On Unsupervised Pretraining Models","display_name":"Fake Audio Detection Based On Unsupervised Pretraining Models","publication_year":2022,"publication_date":"2022-04-27","ids":{"openalex":"https://openalex.org/W4224932929","doi":"https://doi.org/10.1109/icassp43922.2022.9747605"},"language":"en","primary_location":{"id":"doi:10.1109/icassp43922.2022.9747605","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747605","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033243530","display_name":"Zhiqiang Lv","orcid":"https://orcid.org/0000-0002-3071-160X"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiqiang Lv","raw_affiliation_strings":["TEG AI, Tencent Inc,Beijing,China,100193"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TEG AI, Tencent Inc,Beijing,China,100193","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100412142","display_name":"Shanshan Zhang","orcid":"https://orcid.org/0000-0003-4013-6300"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shanshan Zhang","raw_affiliation_strings":["TEG AI, Tencent Inc,Beijing,China,100193"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TEG AI, Tencent Inc,Beijing,China,100193","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012291253","display_name":"Kai Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Tang","raw_affiliation_strings":["TEG AI, Tencent Inc,Beijing,China,100193"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TEG AI, Tencent Inc,Beijing,China,100193","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100703624","display_name":"Pengfei Hu","orcid":"https://orcid.org/0009-0000-4537-6288"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengfei Hu","raw_affiliation_strings":["TEG AI, Tencent Inc,Beijing,China,100193"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TEG AI, Tencent Inc,Beijing,China,100193","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5033243530"],"corresponding_institution_ids":["https://openalex.org/I2250653659"],"apc_list":null,"apc_paid":null,"fwci":6.1744,"has_fulltext":false,"cited_by_count":54,"citation_normalized_percentile":{"value":0.97670759,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"9231","last_page":"9235"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7998613119125366},{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.6094365119934082},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5166400074958801},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.5042024850845337},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.500030517578125},{"id":"https://openalex.org/keywords/audio-analyzer","display_name":"Audio analyzer","score":0.49721506237983704},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.41869205236434937},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.335286021232605},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.18786463141441345},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.0979863703250885}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7998613119125366},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.6094365119934082},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5166400074958801},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.5042024850845337},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.500030517578125},{"id":"https://openalex.org/C160372630","wikidata":"https://www.wikidata.org/wiki/Q4819855","display_name":"Audio analyzer","level":5,"score":0.49721506237983704},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.41869205236434937},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.335286021232605},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.18786463141441345},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.0979863703250885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp43922.2022.9747605","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747605","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W2295634712","https://openalex.org/W2303197844","https://openalex.org/W2483721152","https://openalex.org/W2752782242","https://openalex.org/W2806569010","https://openalex.org/W2890964092","https://openalex.org/W2922490899","https://openalex.org/W2946508582","https://openalex.org/W2972703466","https://openalex.org/W2979373447","https://openalex.org/W2990833974","https://openalex.org/W2991187463","https://openalex.org/W3007151378","https://openalex.org/W3024869864","https://openalex.org/W3036601975","https://openalex.org/W3163596559","https://openalex.org/W3196514189","https://openalex.org/W3196774886","https://openalex.org/W3197580070","https://openalex.org/W3198329097","https://openalex.org/W3199131409","https://openalex.org/W3199161700","https://openalex.org/W3199956586","https://openalex.org/W3200167423","https://openalex.org/W3201016147","https://openalex.org/W3201197228","https://openalex.org/W3201397251","https://openalex.org/W3209984917","https://openalex.org/W3213029956","https://openalex.org/W4221138880","https://openalex.org/W6777437564","https://openalex.org/W6780218876","https://openalex.org/W6799158992","https://openalex.org/W6802012496","https://openalex.org/W6803164887","https://openalex.org/W6804030475"],"related_works":["https://openalex.org/W2098934641","https://openalex.org/W1996547972","https://openalex.org/W1975359510","https://openalex.org/W4214771044","https://openalex.org/W4387698063","https://openalex.org/W4382560817","https://openalex.org/W1611900921","https://openalex.org/W2766269877","https://openalex.org/W2363106653","https://openalex.org/W2153669644"],"abstract_inverted_index":{"This":[0],"work":[1],"presents":[2],"our":[3,80,93],"systems":[4],"for":[5,52,60,98],"the":[6,13,85],"ADD2022":[7,10],"challenge.":[8],"The":[9],"challenge":[11],"is":[12],"first":[14,83],"audio":[15,39,54,63,68,78,101],"deep":[16],"synthesis":[17],"detection":[18,40,64,69],"challenge,":[19],"which":[20],"aims":[21],"to":[22,36],"spot":[23],"various":[24],"kinds":[25],"of":[26],"fake":[27,38,53,62,67,77,100],"audios.":[28],"We":[29],"have":[30],"explored":[31],"using":[32],"unsupervised":[33,45],"pretraining":[34,46],"models":[35,47],"build":[37],"systems.":[41],"Results":[42],"indicate":[43],"that":[44],"can":[48],"achieve":[49],"excellent":[50],"performance":[51],"detection.":[55,102],"Our":[56],"final":[57],"EER":[58],"results":[59,81],"low-quality":[61],"and":[65,72],"partially":[66,76,99],"are":[70],"32.80%":[71],"4.80%":[73],"relatively.":[74],"For":[75],"detection,":[79],"ranked":[82],"in":[84],"competition.":[86],"Even":[87],"trained":[88],"with":[89],"totally":[90],"mismatched":[91],"data,":[92],"method":[94],"still":[95],"generalizes":[96],"well":[97]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":18},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":5}],"updated_date":"2026-05-22T09:01:20.584952","created_date":"2025-10-10T00:00:00"}
