{"id":"https://openalex.org/W4414945404","doi":"https://doi.org/10.1145/3746265.3759665","title":"VAD-Lip: Visual and Audio Deepfake Detection via Lip Features","display_name":"VAD-Lip: Visual and Audio Deepfake Detection via Lip Features","publication_year":2025,"publication_date":"2025-10-08","ids":{"openalex":"https://openalex.org/W4414945404","doi":"https://doi.org/10.1145/3746265.3759665"},"language":"en","primary_location":{"id":"doi:10.1145/3746265.3759665","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746265.3759665","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st on Deepfake Forensics Workshop: Detection, Attribution, Recognition, and Adversarial Challenges in the Era of AI-Generated Media","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3746265.3759665","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102734612","display_name":"Jinyu Wang","orcid":"https://orcid.org/0009-0000-0974-3191"},"institutions":[{"id":"https://openalex.org/I202334528","display_name":"Beijing Electronic Science and Technology Institute","ror":"https://ror.org/01xdzh226","country_code":"CN","type":"education","lineage":["https://openalex.org/I202334528"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"JinYu Wang","raw_affiliation_strings":["Beijing Electronic Science and Technology Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Electronic Science and Technology Institute, Beijing, China","institution_ids":["https://openalex.org/I202334528"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100641352","display_name":"Xin Jin","orcid":"https://orcid.org/0000-0003-3873-1653"},"institutions":[{"id":"https://openalex.org/I202334528","display_name":"Beijing Electronic Science and Technology Institute","ror":"https://ror.org/01xdzh226","country_code":"CN","type":"education","lineage":["https://openalex.org/I202334528"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Jin","raw_affiliation_strings":["Cyber Security, Beijing Electronic Science and Technology Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Cyber Security, Beijing Electronic Science and Technology Institute, Beijing, China","institution_ids":["https://openalex.org/I202334528"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043865759","display_name":"Huaye Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I202334528","display_name":"Beijing Electronic Science and Technology Institute","ror":"https://ror.org/01xdzh226","country_code":"CN","type":"education","lineage":["https://openalex.org/I202334528"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaye Wang","raw_affiliation_strings":["Beijing Electronic Science and Technology Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Electronic Science and Technology Institute, Beijing, China","institution_ids":["https://openalex.org/I202334528"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114094160","display_name":"Longteng Jiang","orcid":"https://orcid.org/0009-0007-5434-9573"},"institutions":[{"id":"https://openalex.org/I202334528","display_name":"Beijing Electronic Science and Technology Institute","ror":"https://ror.org/01xdzh226","country_code":"CN","type":"education","lineage":["https://openalex.org/I202334528"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longteng Jiang","raw_affiliation_strings":["Beijing Electronic Science and Technology Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Electronic Science and Technology Institute, Beijing, China","institution_ids":["https://openalex.org/I202334528"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102734612"],"corresponding_institution_ids":["https://openalex.org/I202334528"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36482444,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"110","last_page":"117"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9509999752044678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6144999861717224},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5870000123977661},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.539900004863739},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.4749999940395355},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.391400009393692},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.3693999946117401}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7939000129699707},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6144999861717224},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5870000123977661},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5464000105857849},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.539900004863739},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.4749999940395355},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.3693999946117401},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36169999837875366},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35089999437332153},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32910001277923584},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.322299987077713},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2976999878883362},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.27709999680519104},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.26649999618530273},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.2535000145435333}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746265.3759665","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746265.3759665","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st on Deepfake Forensics Workshop: Detection, Attribution, Recognition, and Adversarial Challenges in the Era of AI-Generated Media","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3746265.3759665","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746265.3759665","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st on Deepfake Forensics Workshop: Detection, Attribution, Recognition, and Adversarial Challenges in the Era of AI-Generated Media","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2531409750","https://openalex.org/W2551572271","https://openalex.org/W2734984521","https://openalex.org/W2757143884","https://openalex.org/W2891145043","https://openalex.org/W2962958939","https://openalex.org/W2982058372","https://openalex.org/W3034552680","https://openalex.org/W3034713808","https://openalex.org/W3034900344","https://openalex.org/W3081492798","https://openalex.org/W3092879151","https://openalex.org/W3093010840","https://openalex.org/W3093077034","https://openalex.org/W3101631197","https://openalex.org/W3120371271","https://openalex.org/W3178572954","https://openalex.org/W3204893173","https://openalex.org/W4214691743","https://openalex.org/W4319978495","https://openalex.org/W4360993864","https://openalex.org/W4409369524"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,27,39,89,140,164,183],"widespread":[2],"adoption":[3],"of":[4,23,29,41,73,172,177,195],"internet":[5],"technology":[6,31],"and":[7,50,67,95,104,116,128,155,174,186,198],"smart":[8],"devices,":[9],"video":[10],"has":[11,32],"become":[12],"a":[13,83,97],"key":[14],"medium":[15],"for":[16,44,120,147,158],"information":[17],"dissemination,":[18],"permeating":[19],"nearly":[20],"every":[21],"aspect":[22],"social":[24,35,51,56],"life.":[25],"However,":[26],"misuse":[28],"deepfake":[30,100,122],"raised":[33],"several":[34],"issues,":[36],"such":[37],"as":[38],"creation":[40],"fake":[42],"videos":[43,123],"manipulating":[45],"public":[46],"opinion,":[47],"financial":[48],"fraud,":[49],"engineering":[52],"attacks,":[53],"severely":[54],"disrupting":[55],"order.":[57],"Existing":[58],"studies":[59],"primarily":[60],"focus":[61],"on":[62],"pure":[63],"visual":[64,115],"feature":[65],"analysis":[66],"multimodal":[68,99],"detection":[69,72,101,145],"methods,":[70],"but":[71],"audio-video":[74,148],"desynchronization":[75],"forgery":[76,87],"remains":[77],"relatively":[78],"underexplored.":[79],"This":[80],"study":[81],"proposes":[82],"new":[84,152],"large-scale":[85],"audiovisual":[86,129],"dataset,":[88,166],"Audio-Video":[90],"Lip-sync":[91],"Forged":[92],"Dataset":[93],"(AVLiFD),":[94],"introduces":[96],"novel":[98],"method,":[102],"Visual":[103],"Audio":[105],"Deepfake":[106],"Detection":[107],"via":[108],"Lip":[109],"Features":[110],"(VAD-Lip).":[111],"The":[112],"method":[113,142],"combines":[114],"audio":[117],"features":[118],"specifically":[119],"detecting":[121],"forged":[124],"through":[125],"audio,":[126],"video,":[127],"joint":[130,149],"manipulation":[131],"leading":[132],"to":[133],"audio-visual":[134],"desynchronization.":[135],"Experimental":[136],"results":[137],"demonstrate":[138],"that":[139],"proposed":[141],"achieves":[143],"high":[144,192],"accuracy":[146,171,193],"forgery,":[150],"providing":[151],"data":[153],"support":[154],"technical":[156],"solutions":[157],"research":[159],"in":[160],"this":[161],"area.":[162],"On":[163,182],"AVLiFD":[165],"our":[167],"model":[168],"achieved":[169,191],"an":[170,175],"92.50%":[173],"AUC":[176],"0.9518,":[178],"outperforming":[179],"other":[180],"models.":[181],"Celeb-DF,":[184],"FF++,":[185],"DFDC":[187],"datasets,":[188],"it":[189],"also":[190],"rates":[194],"94.67%,":[196],"93.67%,":[197],"92.80%,":[199],"respectively.":[200]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
